diff --git a/.htaccess b/.htaccess new file mode 100644 index 00000000..58eeb9f2 --- /dev/null +++ b/.htaccess @@ -0,0 +1,16 @@ + +AddOutputFilterByType DEFLATE text/plain +AddOutputFilterByType DEFLATE text/html +AddOutputFilterByType DEFLATE text/xml +AddOutputFilterByType DEFLATE text/css +AddOutputFilterByType DEFLATE application/xml +AddOutputFilterByType DEFLATE application/xhtml+xml +AddOutputFilterByType DEFLATE application/rss+xml +AddOutputFilterByType DEFLATE application/javascript +AddOutputFilterByType DEFLATE application/x-javascript +AddOutputFilterByType DEFLATE image/jpg +AddOutputFilterByType DEFLATE image/png +AddOutputFilterByType DEFLATE image/gif +AddOutputFilterByType DEFLATE image/jpeg +AddOutputFilterByType DEFLATE image/svg+xml + \ No newline at end of file diff --git a/CNAME b/CNAME new file mode 100644 index 00000000..505ea8a1 --- /dev/null +++ b/CNAME @@ -0,0 +1 @@ +ldbcouncil.org diff --git a/README.md b/README.md new file mode 100644 index 00000000..eb54e506 --- /dev/null +++ b/README.md @@ -0,0 +1 @@ +This repository is built based on the source at (private repository). diff --git a/becoming-a-member/index.html b/becoming-a-member/index.html new file mode 100644 index 00000000..f6b51213 --- /dev/null +++ b/becoming-a-member/index.html @@ -0,0 +1,381 @@ + + + + + Becoming a Member + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Becoming a Member

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

Benefits

+

The benefits of LDBC membership are:

+
    +
  • Access to the internal LDBC information via its project management system and mailing lists, which include access to discussion documents, datasets, and draft benchmark specifications.
  • +
  • Access to research resources at academic partners and connections to industry members.
  • +
  • Right to membership of LDBC task forces and working groups. Currently, there are task forces on the Social Network Benchmark, Graphalytics, and FinBench, and working groups on graph schemas and query languages.
  • +
  • Right to commission LDBC audits to produce official LDBC benchmark results.
  • +
+

Note: Apart from conformance to the membership agreement, including the Byelaws and the Fair Use Policy, becoming an LDBC member does not involve any further obligations. Members are not required to attend meetings, travel to events, or be involved in any task forces/working groups.

+

Annual membership fees

+
    +
  • Sponsor company/institution: 8,800 GBP
  • +
  • Commercial company: 2,200 GBP
  • +
  • Non-commercial institution: 1,100 GBP
  • +
  • Individual Voting member (standard rate): 165 GBP
  • +
  • Individual Voting member (reduced rate for students, etc.): 10 GBP
  • +
  • Individual Associate member: no subscription fee
  • +
+

Note: For non-sponsor organizations, there is a 2,000 GBP auditing fee, to be paid to LDBC for each audit. Sponsors are exempt from this additional fee.

+

Forms

+

For the latest information on becoming an LDBC member, see the LDBC Membership – Joining and Renewing 2023 document.

+

Please fill out this form if you are an organization or individual applying to join LDBC:

+ +

Fill out one of these forms if you are just contributing to a project in the LDBC GitHub organization:

+ +

In either case, please email your completed form to info@ldbcouncil.org.

+

Constitutional documents

+

See the constitutional documents page.

+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmark-finbench/index.html b/benchmark-finbench/index.html new file mode 100644 index 00000000..588fa8b8 --- /dev/null +++ b/benchmark-finbench/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/benchmarks/finbench/ + + + + + + diff --git a/benchmark-graphalytics/index.html b/benchmark-graphalytics/index.html new file mode 100644 index 00000000..66b5ac71 --- /dev/null +++ b/benchmark-graphalytics/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/benchmarks/graphalytics/ + + + + + + diff --git a/benchmark-snb/index.html b/benchmark-snb/index.html new file mode 100644 index 00000000..722eb105 --- /dev/null +++ b/benchmark-snb/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/benchmarks/snb/ + + + + + + diff --git a/benchmark-spb/index.html b/benchmark-spb/index.html new file mode 100644 index 00000000..b1746b28 --- /dev/null +++ b/benchmark-spb/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/benchmarks/spb/ + + + + + + diff --git a/benchmarks/fair-use-policies/index.html b/benchmarks/fair-use-policies/index.html new file mode 100644 index 00000000..27f98c66 --- /dev/null +++ b/benchmarks/fair-use-policies/index.html @@ -0,0 +1,422 @@ + + + + + Fair Use Policy for LDBC Benchmarks® + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Fair Use Policy for LDBC Benchmarks®

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+ +

The text of this page is based on our Byelaws.

+

LDBC Benchmarks® and LDBC Benchmark® Results

+

LDBC expects all its members to conscientiously observe the provisions of this Fair Use Policy for LDBC Benchmarks. LDBC-approved auditors must bring this Fair Use Policy for LDBC Benchmarks to the attention of any prospective or actual Test Sponsor. The Board of Directors of LDBC is responsible for enforcing this Policy and any alleged violations should be notified to info@ldbcouncil.org.

+
    +
  1. An “LDBC Draft Benchmark®” is a benchmark specification and any associated tooling or datasets, which has been written by an LDBC Task Force or Working Group whose charter includes the goal of achieving adoption of that specification as an LDBC standard, in accordance with Article 33 of the Articles of Association of the Company, “Approval of Standards”.
  2. +
  3. An “LDBC Benchmark®” is an LDBC Draft Benchmark once it has been adopted as an LDBC standard.
  4. +
  5. A result of a performance test can be fairly described as an “LDBC Benchmark Result”, if the test—which may be executed in several runs all of which use the same System Under Test (SUT)—has been successfully audited by an LDBC-approved auditor, and the result is reported as part of an LDBC Benchmark Results set, so it can be interpreted in context.
  6. +
  7. An audit can only be successful if the audited test +
      +
    1. uses a SUT which faithfully implements the mandatory features and chosen optional features of an LDBC Benchmark,
    2. +
    3. completely exercises and generates results for all the mandatory requirements and chosen optional requirements of the LDBC Benchmark, and
    4. +
    5. is conducted and audited in conformance with all the relevant provisions of the LDBC Byelaws, including the statement of Total Cost of Ownership for the SUT and the reporting of price/performance metrics, such that the reported results can legitimately be used to compare the price-weighted performance of two SUTs.
    6. +
    +
  8. +
  9. “LDBC Benchmark Results” is a set of all the results of a successfully audited test. A single LDBC Benchmark Result must be reported as part of such a set.
  10. +
  11. Any description or depiction of a specification that states or implies that it is an LDBC Draft Benchmark or an LDBC Benchmark when that is not the case is an infringement of LDBC’s trademark in the term “LDBC BENCHMARK”, which is registered in several major jurisdictions.
  12. +
  13. The same trademark is infringed by any software which is described or promoted as being an implementation of an LDBC Draft Benchmark or LDBC Benchmark, but which does not faithfully implement the features of or does not support the mandatory requirements of the stated specification.
  14. +
  15. The same trademark is infringed by any report or description of one or more performance test results which are not part of a set of LDBC Benchmark Results, or which in any other way states or implies that the results are endorsed by or originate from LDBC.
  16. +
  17. LDBC considers the use of that trademarked term with respect to performance test results solely in accordance with these Byelaws to be essential to the purpose and reputation of the Company and its benchmark standards.
  18. +
+

Reporting of LDBC Benchmark Results

+

Once an auditor has approved a performance test result, including all required supporting documentation, as being successfully audited, then the Members Council and the Task Force responsible for the benchmark will be notified. The Board will have the results added to the LDBC web site as an LDBC Benchmark Results set according to the following procedure:

+
    +
  1. LDBC members will receive notification of the result via email to their designated contacts within five business days of LDBC receiving the notification.
  2. +
  3. Within five business days of this notice, the LDBC administrator will post the result on the LDBC web site under the rubric “LDBC Benchmark Results” unless the result is withdrawn by the Test Sponsor in the meantime.
  4. +
  5. A result may be challenged and subsequently be withdrawn by the LDBC following a review process as described in Article 7.6.
  6. +
  7. A result that is not challenged within 60 days of its publication will be automatically considered valid and may not be challenged after this time, and this fact will be recorded as part of the website posting of the result.
  8. +
+

Fair Use of the trademark LDBC BENCHMARK

+

Any party wishing to avoid infringement of the trademarked term “LDBC BENCHMARK” should observe the following guidelines relating to its fair use.

+

LDBC encourages use, derived use, study, descriptions, critiques of and suggestions for improvement of LDBC Draft Benchmarks and LDBC Benchmarks. Our benchmark specifications are open-source, and we always welcome new contributors and members. These guidelines are only intended to prevent false or confusing claims relating to performance test results that are intended to be used for product comparisons.

+
    +
  1. If your work is derived from an LDBC Draft or standard Benchmark, or is a partial implementation, or if you are using part of one of our standards for a non-benchmarking purpose, then we would expect you to give attribution, in line with our Creative Commons CC-BY 4.0 licence.
  2. +
  3. We would also suggest that you make a statement, somewhere, somehow, that includes one of these phrases: “This is not an LDBC Benchmark”, “This is not an implementation of an LDBC Benchmark”, or “These are not LDBC Benchmark Results”.
  4. +
  5. We would also suggest that you explain, however briefly, how your work is related to LDBC standards and how it varies from them.
  6. +
+

An example that illustrates these points: you might say something like this in a presentation:

+
+

“We used the LDBC SNB benchmark as a starting point. This isn’t the official LDBC standard: we added four queries because of X, and we don’t attempt to deal with the ACID requirement. The test results aren’t audited, so we want to be clear that this is not an LDBC Benchmark test run, and these numbers are not LDBC Benchmark Results. If you look at this link on the slide I’m showing you can see all the details of how our work is derived from, and varies from, the SNB 2.0 spec.”

+
+

Or you might say:

+
+

“For this example of a GQL graph type we used the LDBC SNB data model. This is nothing to do with the actual LDBC benchmark specification: we just used their data model as a use-case for illustrating what a graph schema might look like. We took this from the SNB 2.0 spec.”

+
+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/finbench/finbench-talk-16th-tuc.pdf b/benchmarks/finbench/finbench-talk-16th-tuc.pdf new file mode 100644 index 00000000..69d3b523 Binary files /dev/null and b/benchmarks/finbench/finbench-talk-16th-tuc.pdf differ diff --git a/benchmarks/finbench/index.html b/benchmarks/finbench/index.html new file mode 100644 index 00000000..0a61bb13 --- /dev/null +++ b/benchmarks/finbench/index.html @@ -0,0 +1,360 @@ + + + + + LDBC Financial Benchmark (LDBC FinBench) + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

LDBC Financial Benchmark (LDBC FinBench)

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as
+anti-fraud and risk control. It is maintained by the LDBC FinBench Task Force.

+

The benchmark has one workload, the Transaction Workload, capturing an OLTP scenario with complex read queries that access the neighbourhood of a given node in the graph and write queries that continuously insert or delete data in the graph. Its data sets are available on Google Drive.

+

For a brief overview, see the slides presented at the 16th TUC meeting. The Financial Benchmark’s specification can be found on arXiv.

+

FinBench Audit

+

Audit results

+

There are no audited results yet.

+

Commissioning audits

+

For auditing requests, please reach out to info@ldbcouncil.org. Audits can only be commissioned by LDBC member companies by contracting any of the LDBC-certified auditors. Note that there is a 2,000 GBP auditing fee to be paid to LDBC by non-sponsor company members. Sponsor companies are exempt from this fee.

+

Use of audited results

+

Fair use policies

+

The LDBC Financial Benchmark is subject to the LDBC Fair Use Policies.

+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/finbench/ldbc-finbench-work-charter.pdf b/benchmarks/finbench/ldbc-finbench-work-charter.pdf new file mode 100644 index 00000000..53bdc5f2 Binary files /dev/null and b/benchmarks/finbench/ldbc-finbench-work-charter.pdf differ diff --git a/benchmarks/graphalytics/datagen-9_4-fb.md5 b/benchmarks/graphalytics/datagen-9_4-fb.md5 new file mode 100644 index 00000000..7d073131 --- /dev/null +++ b/benchmarks/graphalytics/datagen-9_4-fb.md5 @@ -0,0 +1,9 @@ +38e45cc2157d9ac58aa9b71d88eda597 datagen-9_4-fb-BFS +d92295cd9f3266cd60317be5498a6bb3 datagen-9_4-fb-CDLP +a4a2ec19074dfb8035ba23906b42022e datagen-9_4-fb-LCC +efee23b3046a519fca7eaccb2d25c83b datagen-9_4-fb-PR +0aac4961401679a4677e34464d289a98 datagen-9_4-fb-SSSP +3f0ee48788fb67b7dbfb91f5e9281df8 datagen-9_4-fb-WCC +e27ac41236b43105ec2dc637d9c18f13 datagen-9_4-fb.v +ea88ce7eb69fb8bd04d9675c6063db89 datagen-9_4-fb.e +fee5726a16c9be80e461578aa0de31ec datagen-9_4-fb.properties diff --git a/benchmarks/graphalytics/datagen-sf10k-fb.md5 b/benchmarks/graphalytics/datagen-sf10k-fb.md5 new file mode 100644 index 00000000..a73413fa --- /dev/null +++ b/benchmarks/graphalytics/datagen-sf10k-fb.md5 @@ -0,0 +1,9 @@ +0e0ae322ed19be5b9e27ba3747e80dc7 datagen-sf10k-fb-BFS +18a9a1e0841ed95d8102acf7a1c6f07a datagen-sf10k-fb-CDLP +f4a40d8c28df120ddcf99ee1cce63d8a datagen-sf10k-fb-LCC +916fc2a7441b3f91c1b55b9e31343746 datagen-sf10k-fb-PR +fea3e750b4dd4778e92d8ba8f5fd851c datagen-sf10k-fb-SSSP +8492393a263a97ca7699e4ae305cd6d4 datagen-sf10k-fb-WCC +e0f44f491673601c972e0b6cc1956210 datagen-sf10k-fb.v +f51b3b2b0be31450df064d5dc93afa70 datagen-sf10k-fb.e +8e4899461fe0e600f506949847fd9350 datagen-sf10k-fb.properties diff --git a/benchmarks/graphalytics/datagen-sf3k-fb.md5 b/benchmarks/graphalytics/datagen-sf3k-fb.md5 new file mode 100644 index 00000000..b54434a0 --- /dev/null +++ b/benchmarks/graphalytics/datagen-sf3k-fb.md5 @@ -0,0 +1,9 @@ +61dcb2aa6d9d7bc0bf2371c05fa301fb datagen-sf3k-fb-BFS +ee421e17f579c4ee56a4cca9464af028 datagen-sf3k-fb-CDLP +b3ef2af6288a0d90d575f4af8f8bb37f datagen-sf3k-fb-LCC +2bbb3f2f19945ecda2b1bcb34e328aa1 datagen-sf3k-fb-PR +a22e3c363f42f3ad676669eef2cc5bf9 datagen-sf3k-fb-SSSP +44fc01388f60820e7853de521453bc8f datagen-sf3k-fb-WCC +201c44c0a285602ed8974d45fa27bfdb datagen-sf3k-fb.v +8cee484579faf5e21e6204af1d6b22c5 datagen-sf3k-fb.e +56beff84261ccfdc86c383c87e43b4c2 datagen-sf3k-fb.properties diff --git a/benchmarks/graphalytics/graph500-27.md5 b/benchmarks/graphalytics/graph500-27.md5 new file mode 100644 index 00000000..aa104a98 --- /dev/null +++ b/benchmarks/graphalytics/graph500-27.md5 @@ -0,0 +1,8 @@ +a74369ca68d96540b7a7ad32c5330e18 graph500-27-BFS +0b669d439a6d8720bc76b5ad5dce316b graph500-27-CDLP +039164e31cbcb906ba2d24a95206de33 graph500-27-LCC +c10cd1fd0073d1d8c6129b44493b1a6e graph500-27-PR +e06a58c914d8777a7af4edfb49418b7e graph500-27-WCC +11e30e0644e0664c36d94f1eb6dc1dfe graph500-27.v +578778aa5e034661e8fd09028ecce363 graph500-27.e +ef4abdd11d081f551ad4932a907b5d01 graph500-27.properties diff --git a/benchmarks/graphalytics/graph500-28.md5 b/benchmarks/graphalytics/graph500-28.md5 new file mode 100644 index 00000000..2305a59d --- /dev/null +++ b/benchmarks/graphalytics/graph500-28.md5 @@ -0,0 +1,8 @@ +45dff47cbec77ce77ae2c80f1e64e97a graph500-28-BFS +0aa6a52bbe45e0b2f97581043e14b8fb graph500-28-CDLP +5212bb51a7c285e994feb297358c74b0 graph500-28-LCC +32837223b988a2eb03b82b8f1bed224b 
graph500-28-PR +c71e6963a1cff7b4392d3d6e9bc2d2e1 graph500-28-WCC +a25fb88d220fde0bffddb60b75237d6e graph500-28.v +02ee07342d20ec3ea850f576b473bb00 graph500-28.e +9bd2866bf0c26e8dbe52ece1c7da839a graph500-28.properties diff --git a/benchmarks/graphalytics/graph500-29.md5 b/benchmarks/graphalytics/graph500-29.md5 new file mode 100644 index 00000000..761e8dc8 --- /dev/null +++ b/benchmarks/graphalytics/graph500-29.md5 @@ -0,0 +1,8 @@ +a79d313775b1afd6e6dad4c1c5f131c1 graph500-29-BFS +94c6b8ac82664973e5f9d4d3dd8292f8 graph500-29-CDLP +5afc9b0bf64d8bd572df54cada249ae4 graph500-29-LCC +e0eb05a8dbea49d53dee18306cd53641 graph500-29-PR +b3f423edac470ced445a8c715ca09942 graph500-29-WCC +b44e047d7aa80b818a4187574a1a5797 graph500-29.v +100cd63d096f228d5b7c9aa1a71a9a85 graph500-29.e +49d4023cdc452de105fef23c88dceae4 graph500-29.properties diff --git a/benchmarks/graphalytics/graph500-30.md5 b/benchmarks/graphalytics/graph500-30.md5 new file mode 100644 index 00000000..dfb5e5cd --- /dev/null +++ b/benchmarks/graphalytics/graph500-30.md5 @@ -0,0 +1,8 @@ +3fd0f5ea5b6f25d82f099f7a0042f9c4 graph500-30-BFS +84b4634fd584babdc3e1494a6417b240 graph500-30-CDLP +89e70b27420916231a830abfd15f8537 graph500-30-LCC +317b3e7da73f501389dcd2c19603a226 graph500-30-PR +c33d8e13d8f84426757816e8ef792a9f graph500-30-WCC +004e13a22aba4c4cf94fc1ea3a460e6f graph500-30.v +3df72be3b189ba9c0c8b6c1f3762eda9 graph500-30.e +bf352710c02f5baea96f63b4e64738ef graph500-30.properties diff --git a/benchmarks/graphalytics/index.html b/benchmarks/graphalytics/index.html new file mode 100644 index 00000000..8111226c --- /dev/null +++ b/benchmarks/graphalytics/index.html @@ -0,0 +1,845 @@ + + + + + LDBC Graphalytics Benchmark (LDBC Graphalytics) + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

LDBC Graphalytics Benchmark (LDBC Graphalytics)

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

The Graphalytics benchmark is an industrial-grade benchmark for graph analysis platforms such as Giraph, Spark GraphX, and GraphBLAS. It consists of six core algorithms, standard data sets, and reference outputs, enabling the objective comparison of graph analysis platforms.

+

The benchmark harness consists of a core component, which is extendable by a driver for each different platform implementation. The benchmark includes the following algorithms:

+
    +
  1. breadth-first search (BFS)
  2. +
  3. PageRank (PR)
  4. +
  5. weakly connected components (WCC)
  6. +
  7. community detection using label propagation (CDLP)
  8. +
  9. local clustering coefficient (LCC)
  10. +
  11. single-source shortest paths (SSSP)
  12. +
+
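To give a feel for the kind of computation these workloads specify, the sketch below shows a minimal, single-threaded BFS over an in-memory adjacency list. It is only an illustration of the algorithm's semantics (hop distance from a source vertex); the object name, function name, and data representation are our own, and it is neither the Graphalytics reference implementation nor a benchmark driver.

```scala
import scala.collection.mutable

// Illustrative sketch only -- not the Graphalytics reference implementation or a driver.
object BfsSketch {
  // Computes the distance in hops from `source` for every vertex reachable via `adj`.
  def bfs(adj: Map[Long, Seq[Long]], source: Long): Map[Long, Long] = {
    val dist  = mutable.Map(source -> 0L)   // source is at distance 0
    val queue = mutable.Queue(source)
    while (queue.nonEmpty) {
      val v = queue.dequeue()
      for (w <- adj.getOrElse(v, Seq.empty) if !dist.contains(w)) {
        dist(w) = dist(v) + 1               // first visit fixes the hop count
        queue += w
      }
    }
    dist.toMap                              // vertices absent from the result are unreachable
  }

  def main(args: Array[String]): Unit = {
    // Tiny example graph: 1 -> 2 -> 3, plus an isolated vertex 4.
    val adj = Map(1L -> Seq(2L), 2L -> Seq(3L), 3L -> Seq.empty[Long], 4L -> Seq.empty[Long])
    println(bfs(adj, 1L))                   // 1 -> 0, 2 -> 1, 3 -> 2; vertex 4 is absent
  }
}
```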

The choice of these algorithms was carefully motivated, using the LDBC TUC and extensive literature surveys to ensure good coverage of scenarios. The standard data sets include both real and synthetic data sets, which are classified into intuitive “T-shirt” sizes (S, M, L, etc.).

+

Each experiment set in Graphalytics consists of multiple platform runs (a platform executes an algorithm on a data set), and a diverse set of experiments is carried out to evaluate different performance characteristics of a system under test.

+

All completed benchmarks must go through a strict validation process to ensure the integrity of the performance results.

+

The development of Graphalytics is supported by many active vendors in the field of large-scale graph analytics. Graphalytics already facilitates benchmarks for a large number of graph analytics platforms, such as GraphBLAS, Giraph, GraphX, and PGX.D, allowing comparison of the state-of-the-art system performance of both community-driven and industry-driven platforms. To get started, the details of the Graphalytics documentation and its software components are described below.

+

Documents and repositories

+ +

Graphalytics competition 2023

+

In 2023, we will hold a new round of the Graphalytics competition. See the LDBC Graphalytics Benchmark presentation for an introduction to the benchmark framework and the competition’s rules.

+

Artifacts:

+ +

Rules

+
    +
  • Participation is free.
  • +
  • There are no monetary prizes.
  • +
  • Single-node and distributed implementations are allowed.
  • +
  • Partial implementations (e.g. just small to mid-sized data sets and only a few algorithms) are allowed.
  • +
  • Submissions should execute each algorithm-data set combination three times. From these, the arithmetic mean of the processing times is used for ranking.
  • +
  • The results of the competition will be published on the LDBC website in the form of leaderboards, which rank them based on performance and price-performance (adjusted for the system price).
  • +
  • There is a global leaderboard that includes all algorithms and scale factors. Additionally, there is a separate leaderboard for each scale (S, M, L, XL, 2XL+), algorithm, and system category (CPU-based/GPU-based, single-node vs. distributed) to allow for fine-grained comparison.
  • +
  • Submissions are subject to code review and reproducibility attempts from the organizers.
  • +
  • System prices should be reported following the TPC Pricing specification.
  • +
+

Recommendations for submissions

+
    +
  • Submissions using modern hardware are welcome (GPUs, FPGAs, etc.).
  • +
  • We encourage the use of cloud compute instances for running the benchmark (if possible).
  • +
+

Important dates

+
    +
  • March 17: Competition is announced
  • +
  • April 25: Confirmation of intent
  • +
  • May 1: Submissions open
  • +
  • June 25: Submissions close
  • +
+

Data sets

+

The Graphalytics data sets are compressed using zstd. The total size of the compressed archives is approximately 350 GB. When decompressed, the data sets require approximately 1.5 TB of disk space.

+

For detailed information on the data sets, see the table with their statistics.

+

The data sets are available in two locations:

+ +

Note that some of the Graphalytics data sets were fixed in March 2023. Prior to this, they were incorrectly packaged or had missing/incorrect reference outputs for certain algorithms. If you are uncertain whether you have the correct versions, cross-check them against these MD5 checksums: datagen-9_4-fb, datagen-sf3k-fb, datagen-sf10k-fb, graph500-27, graph500-28, graph500-29, graph500-30.
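If you prefer to script the cross-check, the sketch below is one way to do it: it recomputes the MD5 of each extracted file listed in one of the published .md5 files and compares it against the expected value. This is our own illustration, not an official LDBC tool; the object name and the default checksum file name are assumptions, and it expects the .tar.zst archives to have been extracted already (e.g. with zstd).

```scala
import java.nio.file.{Files, Paths}
import java.security.MessageDigest
import scala.io.Source

// Illustrative sketch (not an official LDBC tool): verify extracted Graphalytics files
// against a published .md5 checksum file, whose lines have the form "<md5>  <file name>".
object VerifyMd5 {
  private def md5Hex(path: String): String = {
    val digest = MessageDigest.getInstance("MD5")
    val in = Files.newInputStream(Paths.get(path))
    try {
      val buf = new Array[Byte](1 << 20)
      // Stream the file through the digest so multi-gigabyte files fit in memory.
      Iterator.continually(in.read(buf)).takeWhile(_ != -1).foreach(n => digest.update(buf, 0, n))
    } finally in.close()
    digest.digest().map(b => f"$b%02x").mkString
  }

  def main(args: Array[String]): Unit = {
    // Assumed local file name; pass a different .md5 file as the first argument if needed.
    val checksumFile = args.headOption.getOrElse("datagen-9_4-fb.md5")
    val src = Source.fromFile(checksumFile)
    try {
      for (line <- src.getLines() if line.trim.nonEmpty) {
        val Array(expected, name) = line.trim.split("\\s+", 2)
        val ok = md5Hex(name) == expected
        println(s"${if (ok) "OK      " else "MISMATCH"}  $name")
      }
    } finally src.close()
  }
}
```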

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
data set#nodes#edgesscalelinksize
cit-Patents3,774,76816,518,947XScit-Patents.tar.zst119.1 MB
com-friendster65,608,3661,806,067,135XLcom-friendster.tar.zst6.7 GB
datagen-7_5-fb633,43234,185,747Sdatagen-7_5-fb.tar.zst162.3 MB
datagen-7_6-fb754,14742,162,988Sdatagen-7_6-fb.tar.zst200.0 MB
datagen-7_7-zf13,180,50832,791,267Sdatagen-7_7-zf.tar.zst434.5 MB
datagen-7_8-zf16,521,88641,025,255Sdatagen-7_8-zf.tar.zst544.3 MB
datagen-7_9-fb1,387,58785,670,523Sdatagen-7_9-fb.tar.zst401.2 MB
datagen-8_0-fb1,706,561107,507,376Mdatagen-8_0-fb.tar.zst502.5 MB
datagen-8_1-fb2,072,117134,267,822Mdatagen-8_1-fb.tar.zst625.4 MB
datagen-8_2-zf43,734,497106,440,188Mdatagen-8_2-zf.tar.zst1.4 GB
datagen-8_3-zf53,525,014130,579,909Mdatagen-8_3-zf.tar.zst1.7 GB
datagen-8_4-fb3,809,084269,479,177Mdatagen-8_4-fb.tar.zst1.2 GB
datagen-8_5-fb4,599,739332,026,902Ldatagen-8_5-fb.tar.zst1.5 GB
datagen-8_6-fb5,667,674421,988,619Ldatagen-8_6-fb.tar.zst1.9 GB
datagen-8_7-zf145,050,709340,157,363Ldatagen-8_7-zf.tar.zst4.6 GB
datagen-8_8-zf168,308,893413,354,288Ldatagen-8_8-zf.tar.zst5.3 GB
datagen-8_9-fb10,572,901848,681,908Ldatagen-8_9-fb.tar.zst3.7 GB
datagen-9_0-fb12,857,6711,049,527,225XLdatagen-9_0-fb.tar.zst4.6 GB
datagen-9_1-fb16,087,4831,342,158,397XLdatagen-9_1-fb.tar.zst5.8 GB
datagen-9_2-zf434,943,3761,042,340,732XLdatagen-9_2-zf.tar.zst13.7 GB
datagen-9_3-zf555,270,0531,309,998,551XLdatagen-9_3-zf.tar.zst17.4 GB
datagen-9_4-fb29,310,5652,588,948,669XLdatagen-9_4-fb.tar.zst14.0 GB
datagen-sf3k-fb33,484,3752,912,009,743XLdatagen-sf3k-fb.tar.zst12.7 GB
datagen-sf10k-fb100,218,7509,404,822,5382XLdatagen-sf10k-fb.tar.zst40.5 GB
dota-league61,17050,870,313Sdota-league.tar.zst114.3 MB
graph500-222,396,65764,155,735Sgraph500-22.tar.zst202.4 MB
graph500-234,610,222129,333,677Mgraph500-23.tar.zst410.6 MB
graph500-248,870,942260,379,520Mgraph500-24.tar.zst847.7 MB
graph500-2517,062,472523,602,831Lgraph500-25.tar.zst1.7 GB
graph500-2632,804,9781,051,922,853XLgraph500-26.tar.zst3.4 GB
graph500-2763,081,0402,111,642,032XLgraph500-27.tar.zst7.1 GB
graph500-28121,242,3884,236,163,9582XLgraph500-28.tar.zst14.4 GB
graph500-29232,999,6308,493,569,1152XLgraph500-29.tar.zst29.6 GB
graph500-30447,797,98617,022,117,3623XLgraph500-30.tar.zst60.8 GB
kgs832,24717,891,698XSkgs.tar.zst65.7 MB
twitter_mpi52,579,6781,963,263,508XLtwitter_mpi.tar.zst5.7 GB
wiki-Talk2,394,3855,021,4102XSwiki-Talk.tar.zst34.9 MB
example-directed1017-example-directed.tar.zst1.0 KB
example-undirected912-example-undirected.tar.zst1.0 KB
test-bfs-directed<100<100-test-bfs-directed.tar.zst<2.0 KB
test-bfs-undirected<100<100-test-bfs-undirected.tar.zst<2.0 KB
test-cdlp-directed<100<100-test-cdlp-directed.tar.zst<2.0 KB
test-cdlp-undirected<100<100-test-cdlp-undirected.tar.zst<2.0 KB
test-pr-directed<100<100-test-pr-directed.tar.zst<2.0 KB
test-pr-undirected<100<100-test-pr-undirected.tar.zst<2.0 KB
test-lcc-directed<100<100-test-lcc-directed.tar.zst<2.0 KB
test-lcc-undirected<100<100-test-lcc-undirected.tar.zst<2.0 KB
test-wcc-directed<100<100-test-wcc-directed.tar.zst<2.0 KB
test-wcc-undirected<100<100-test-wcc-undirected.tar.zst<2.0 KB
test-sssp-directed<100<100-test-sssp-directed.tar.zst<2.0 KB
test-sssp-undirected<100<100-test-sssp-undirected.tar.zst<2.0 KB
+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/graphalytics/spec-graphalytics-competitions.pdf b/benchmarks/graphalytics/spec-graphalytics-competitions.pdf new file mode 100644 index 00000000..51a0a47d Binary files /dev/null and b/benchmarks/graphalytics/spec-graphalytics-competitions.pdf differ diff --git a/benchmarks/index.html b/benchmarks/index.html new file mode 100644 index 00000000..970509c1 --- /dev/null +++ b/benchmarks/index.html @@ -0,0 +1,777 @@ + + + + + Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Benchmarks

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Posts

+
Tags:
+ +
+
+ + + +
+
+ +
+ + +
+
+
+ +

Record-Breaking SNB Interactive Results for GraphScope

+
Tags:
+ BENCHMARK + , SNB + +
+
+ +

We are happy to announce new audited results for the SNB Interactive workload, achieved by the open-source GraphScope Flex system.

+

The current audit of the system has broken several records:

+
    +
  • It achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s.
  • +
  • It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s.
  • +
  • It is the first system to successfully complete the benchmark on …
+ +
+
+ +
+ + +
+
+ +
+ +

Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and tests for the GQL language. See this announcement from Alastair Green, Vice-chair of LDBC.

+

These tools are the work of the LDBC GQL Implementation Working Group, headed up by Michael Burbidge. Damian Wileński and Dominik Tomaszuk have worked …

+ +
+
+ +
+ + +
+
+ +
+ +

We are delighted to announce the official release of the initial version (v0.1.0) of Financial Benchmark (FinBench).

+

The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the LDBC FinBench Task Force. The benchmark currently has one workload, the Transaction Workload, capturing an OLTP scenario with complex read queries that access the …

+ +
+
+ +
+ + +
+
+
+ +

LDBC SNB – Early 2023 updates

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

2023 has been an eventful year for us so far. Here is a summary of our recent activities.

+
    +
  1. +

    Our paper The LDBC Social Network Benchmark: Business Intelligence Workload was published in PVLDB.

    +
  2. +
  3. +

    David Püroja just completed his MSc thesis on creating a design towards SNB Interactive v2 at CWI’s Database Architectures group. David and I gave a deep-dive talk at the FOSDEM conference’s graph developer room titled The LDBC Social Network …

+ +
+
+ +
+ + +
+
+
+ +

LDBC SNB Datagen – The winding path to SF100K

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

LDBC SNB provides a data generator, which produces synthetic datasets, mimicking a social network’s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism and usability. More than two years have elapsed since my last technical update on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/index.xml b/benchmarks/index.xml new file mode 100644 index 00000000..6ce56524 --- /dev/null +++ b/benchmarks/index.xml @@ -0,0 +1,5467 @@ + + + + Benchmarks on Linked Data Benchmark Council + https://ldbcouncil.org/benchmarks/ + Recent content in Benchmarks on Linked Data Benchmark Council + Hugo -- gohugo.io + en-us + &copy; Copyright LDBC 2024 + + Eighteenth TUC Meeting + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + Fri, 30 Aug 2024 09:00:00 -0800 + + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Shipeng Qi (AntGroup), Wenyuan Yu (Alibaba Demo), Yan Zhou (CreateLink)</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located in <strong>Guangzhou</strong> with <a href="https://vldb.org/2024/">VLDB 2024</a> on <strong>August 30-31 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. <strong>If you would like to participate please register using <a href="https://forms.gle/aVPrrcxXpSwrWPnh6">our form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="august-30-friday">August 30, Friday</h4> +<p><strong>Location:</strong> <a href="https://www.langhamhotels.com/en/the-langham/guangzhou/">Langham Place</a>, Guangzhou, <strong>room 1</strong>,<br> +co-located with VLDB (N0.630-638 Xingang Dong Road, Haizhu District, Guangzhou, China). See the map <a href="https://maps.app.goo.gl/86jD3Dy9Aa7bwLs36">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="august-31-saturday">August 31, Saturday</h4> +<p><strong>Location:</strong> Alibaba Center, Guangzhou (N0.88 Dingxin Road, Haizhu District, Guangzhou, China), near to VLDB Langham Place. See the map <a href="https://maps.app.goo.gl/HgEVafZMRmrzUsgW8">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + Seventeenth TUC Meeting + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + Sun, 09 Jun 2024 09:00:00 -0400 + + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + <p><strong>Organizers:</strong> Renzo Angles, Sebastián Ferrada</p> +<p>LDBC is hosting a one-day in-person workshop, co-located in <strong>Santiago de Chile</strong> with <a href="https://2024.sigmod.org/venue.shtml">SIGMOD 2024</a> on <strong>June 9 (Sunday)</strong>.</p> +<p>The workshop will be held in the <strong>Hotel Plaza El Bosque Ebro</strong> (<a href="https://www.plazaelbosque.cl">https://www.plazaelbosque.cl</a>), which is two blocks away from SIGMOD&rsquo;s venue. 
See the map <a href="https://maps.app.goo.gl/78oiw3zo2pH3gy5R6">here</a>.</p> +<p><strong>If you would like to participate please register using <a href="https://forms.gle/XXgaQfwBZAMMZJb78">this form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in Chile time (GMT-4).</strong></p> +<p><strong>Each speaker will have 20 minutes for exposition plus 5 minutes for questions.</strong></p> +<table> +<thead> +<tr> +<th>Time</th> +<th>Speaker</th> +<th>Title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>Welcome</td> +<td>&ldquo;Canelo&rdquo; saloon</td> +</tr> +<tr> +<td>09:30</td> +<td>Alastair Green (LDBC Vice-chair)</td> +<td>Status of the LDBC Extended GQL Schema Working Group</td> +</tr> +<tr> +<td>10:00</td> +<td>Hannes Voigt (Neo4j)</td> +<td>Inside the Standardization Machine Room: How ISO/IEC 39075:2024 – GQL was produced</td> +</tr> +<tr> +<td>10:30</td> +<td>Calin Iorgulescu (Oracle)</td> +<td>PGX.D: Distributed graph processing engine</td> +</tr> +<tr> +<td>11:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>11:30</td> +<td>Ricky Sun (Ultipa, Inc.)</td> +<td>A Unified Graph Framework with SCC (Storage-Compute Coupled) and HDC (High-Density Computing) Clustering</td> +</tr> +<tr> +<td>12:00</td> +<td>Daan de Graaf (TU Eindhoven)</td> +<td>Algorithm Support in a Graph Database, Done Right</td> +</tr> +<tr> +<td>12:30</td> +<td>Angela Bonifati (Lyon 1 University and IUF, France)</td> +<td>Transforming Property Graphs</td> +</tr> +<tr> +<td>13:00</td> +<td>Brunch</td> +<td></td> +</tr> +<tr> +<td>14:00</td> +<td>Juan Sequeda (data.world)</td> +<td>A Benchmark to Understand the Role of Knowledge Graphs on Large Language Model&rsquo;s Accuracy for Question Answering on Enterprise SQL Databases</td> +</tr> +<tr> +<td>14:30</td> +<td>Olaf Hartig (Linköping University)</td> +<td>FedShop: A Benchmark for Testing the Scalability of SPARQL Federation Engines</td> +</tr> +<tr> +<td>15:00</td> +<td>Olaf Hartig (Amazon)</td> +<td>Datatypes for Lists and Maps in RDF Literals</td> +</tr> +<tr> +<td>15:30</td> +<td>Peter Boncz (CWI and MotherDuck)</td> +<td>The state of DuckPGQ</td> +</tr> +<tr> +<td>16:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>16:30</td> +<td>Juan Reutter (IMFD and PUC Chile)</td> +<td>MillenniumDB: A Persistent, Open-Source, Graph Database</td> +</tr> +<tr> +<td>17:00</td> +<td>Carlos Rojas (IMFD)</td> +<td>WDBench: A Wikidata Graph Query Benchmark</td> +</tr> +<tr> +<td>17:30</td> +<td>Sebastián Ferrada (IMFD and Univ. 
de Chile)</td> +<td>An algebra for evaluating path queries</td> +</tr> +<tr> +<td>19:30</td> +<td>Dinner</td> +<td></td> +</tr> +</tbody> +</table> + + + + + Record-Breaking SNB Interactive Results for GraphScope + https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/ + Sun, 26 May 2024 00:00:00 +0000 + + https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/ + <p>We are happy to annonunce new <a href="https://ldbcouncil.org/benchmarks/snb-interactive/">audited results for the SNB Interactive workload</a>, achieved by the open-source <a href="https://github.com/alibaba/GraphScope">GraphScope Flex</a> system.</p> +<p>The current audit of the system has broken several records:</p> +<ul> +<li>It achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s.</li> +<li>It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s.</li> +<li>It is the first system to successfully complete the benchmark on scale factor 1000. It achieved a throughput of 127.8k ops/s</li> +</ul> +<p>The audit was commissioned by the <a href="https://www.alibabacloud.com/">Alibaba Cloud</a> and was conducted by <a href="https://www.linkedin.com/in/arnau-prat-a70283bb/">Dr. Arnau Prat-Pérez</a>, one of the original authors of the SNB Interactive benchmark. The queries were implemented as C++ stored procedures and the benchmark was executed on the Alibaba Cloud&rsquo;s infrastructure. The <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf">executive summary</a>, <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf">full disclosure report</a>, and <a href="%5B/benchmarks/snb/%5D(https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-attachments.tar.gz)">supplementary package</a> describe the benchmark&rsquo;s steps and include instructions for reproduction.</p> +<p>LDBC would like to congratulate the GraphScope Flex team on their record-breaking results.</p> +<div align="center"><img src="https://ldbcouncil.org/images/graphscope.svg" width="200"></div> + + + + + Launching open-source language tools for ISO/IEC GQL + https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/ + Thu, 09 May 2024 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/ + <p>Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and tests for the GQL language. See this <a href="https://ldbcouncil.org/pages/opengql-announce">announcement from Alastair Green, Vice-chair of LDBC</a>.</p> +<p>These tools are the work of the <strong>LDBC GQL Implementation Working Group</strong>, headed up by Michael Burbidge. 
Damian Wileński and Dominik Tomaszuk have worked with Michael to create these artefacts based on his ANTLR grammar for GQL.</p> + + + + + Announcing the Official Release of LDBC Financial Benchmark v0.1.0 + https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/ + Tue, 27 Jun 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/ + <p>We are delighted to announce the official release of the initial version (v0.1.0) of <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench)</a>.</p> +<p>The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">LDBC FinBench Task Force</a>. The benchmark has one workload currently, <strong>Transaction Workload</strong>, capturing OLTP scenario with complex read queries that access the neighbourhood of a given node in the graph and write queries that continuously insert or delete data in the graph.</p> +<p>Compared to LDBC SNB, the FinBench differs in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. For a brief overview, see the <a href="https://ldbcouncil.org/benchmarks/finbench/finbench-talk-16th-tuc.pdf">slides</a> in the 16th TUC. The <a href="https://arxiv.org/pdf/2306.15975.pdf">Financial Benchmark&rsquo;s specification</a> can be found on arXiv.</p> +<p>The release of FinBench initial version (v0.1.0) was approved by LDBC on June 23, 2023. It is the good beginning of FinBench. In the future, the FinBench Task Force will polish the benchmark continuously.</p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or qishipeng.qsp at antgroup.com.</p> + + + + + Sixteenth TUC Meeting + https://ldbcouncil.org/event/sixteenth-tuc-meeting/ + Fri, 23 Jun 2023 09:00:00 -0800 + + https://ldbcouncil.org/event/sixteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Oskar van Rest, Alastair Green, Gábor Szárnyas</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2023.sigmod.org/venue.shtml">SIGMOD 2023</a> on <strong>June 23-24 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. 
<strong>If you would like to participate please register using <a href="https://forms.gle/T6bwVHzK9V5FaKyR9">our form</a>.</strong></p> +<p>LDBC will host a <strong>social event</strong> on Friday at the <a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a>.</p> +<p>In addition, AWS will host a <strong>Happy Hour</strong> (rooftop grill with beverages) on Saturday on the Amazon Nitro South building&rsquo;s 8th floor deck: <a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>.</p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="friday">Friday</h4> +<p><strong>Location:</strong> Hyatt Regency Bellevue on Seattle&rsquo;s Eastside, <strong>room Grand K</strong>, co-located with SIGMOD (<a href="https://www.hyatt.com/en-US/hotel/washington/hyatt-regency-bellevue-on-seattles-eastside/belle">900 Bellevue Way NE, Bellevue, WA 98004-4272</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>08:30</td> +<td>08:45</td> +<td>Oskar van Rest (Oracle)</td> +<td>LDBC – State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-ldbc-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/Frk7ITssaSY">video</a></td> +</tr> +<tr> +<td>08:50</td> +<td>09:05</td> +<td>Keith Hare (JCC / WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/keith-hare-an-update-on-the-gql-and-sql-pgq-standards-efforts.pdf">slides</a>, <a href="https://youtu.be/LQYkal_0j6E">video</a></td> +</tr> +<tr> +<td>09:10</td> +<td>09:25</td> +<td>Stefan Plantikow (Neo4j / WG3)</td> +<td>GQL - Introduction to a new query language standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/stefan-plantikow-gql-v1.pdf">slides</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Leonid Libkin (University of Edinburgh &amp; RelationalAI)</td> +<td>Formalizing GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/leonid-libkin-formalizing-gql.pdf">slides</a>, <a href="https://youtu.be/YZE1a00h1I4">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Semen Panenkov (JetBrains Research)</td> +<td>Mechanizing the GQL semantics in Coq – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/semyon-panenkov-gql-in-coq.pdf">slides</a>, <a href="https://youtu.be/5xBGohqWCzo">videos</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Oskar van Rest (Oracle)</td> +<td>SQL Property Graphs in Oracle Database and Oracle Graph Server (PGX) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-sql-property-graphs-in-oracle-database-and-oracle-graph-server-pgx.pdf">slides</a>, <a href="https://youtu.be/owM9WiQubpg">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (JCC)</td> +<td>LDBC&rsquo;s organizational changes and fair use policies – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-ldbc-corporate-restructuring-and-fair-use-policies.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>Ioana Manolescu (INRIA)</td> +<td>Integrating Connection Search in Graph Queries – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ioana-manolescu-integrating-connection-search-in-graph-queries.pdf">slides</a>, <a href="https://youtu.be/LQPnmcrkUpY">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Maciej Besta (ETH Zurich)</td> +<td>Neural Graph Databases with Graph Neural Networks – <a href="https://youtu.be/ce5qNievRNs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:10</td> +<td>Longbin Lai (Alibaba Damo Academy)</td> +<td>To Revisit Benchmarking Graph Analytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/longbin-lai-benchmark-ldbc.pdf">slides</a>, <a href="https://youtu.be/s9Vtt-6t_FI">video</a></td> +</tr> +<tr> +<td>12:15</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>The World of Graph Databases from An Industry Perspective – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/yuanyuan-tian-world-of-graph-databases.pdf">slides</a>, <a href="https://youtu.be/AZuP_b95GPM">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Alin Deutsch (UC San Diego &amp; TigerGraph)</td> +<td>TigerGraph&rsquo;s Parallel Computation Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alin-deutsch-tigergraphs-computation-model.pdf">slides</a>, <a href="https://youtu.be/vcxdieJB80Y">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Chen Zhang (CreateLink)</td> +<td>Applications of a Native Distributed Graph Database in the Financial Industry – <a href="https://youtu.be/GCCT79Sps9I">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Ricky Sun (Ultipa)</td> +<td>Design of highly scalable graph database systems – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ricky-sun-ultipa.pdf">slides</a>, <a href="https://youtu.be/Sg1F64O4vGM">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Heng Lin (Ant Group)</td> +<td>The LDBC SNB implementation in TuGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-the-ldbc-snb-implementation-in-tugraph.pdf">slides</a>, <a href="https://youtu.be/fy8AuVerwnY">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>Shipeng Qi (Ant Group)</td> +<td>FinBench: The new LDBC benchmark targeting financial scenario – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/shipeng-qi-finbench.pdf">slides</a>, <a href="https://youtu.be/0xLZadDOfZk">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>17:00</td> +<td>host: Heng Lin (Ant Group), panelists: Longbin Lai (Alibaba Damo Academy), Ricky Sun (Ultipa), Gabor Szarnyas (CWI), Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>FinBench panel – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-finbench-panel.pdf">slides</a></td> +</tr> +<tr> +<td>19:00</td> +<td>22:00</td> +<td><em>dinner</em></td> +<td><em><a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a></em></td> +</tr> +</tbody> +</table> +<h4 id="saturday">Saturday</h4> +<p><strong>Location:</strong> Amazon Nitro South building, <strong>room 03.204</strong> (<a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>09:45</td> +<td>Brad Bebee (AWS)</td> +<td>Customers don&rsquo;t want a graph database, so why are we still here? – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/brad-bebee-tuc-keynote.pdf">slides</a>, <a href="https://youtu.be/bJlkpDC--fM">video</a></td> +</tr> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Fast and Efficient Update Handling for Graph H2TAP – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/muhammad-attahir-jibril-fast-and-efficient-update-handling-for-graph-h2tap.pdf">slides</a>, <a href="https://youtu.be/e8ZAszBsXV0">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Gabor Szarnyas (CWI)</td> +<td>LDBC Social Network Benchmark and Graphalytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-social-network-benchmark-and-graphalytics.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:30</td> +<td>Atanas Kiryakov and Tomas Kovachev (Ontotext)</td> +<td>GraphDB – Benchmarking against LDBC SNB &amp; SPB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tomas-kovatchev-atanas-kiryakov-benchmarking-graphdb-with-snb-and-spb.pdf">slides</a>, <a href="https://youtu.be/U6OPpNFOWqg">video</a></td> +</tr> +<tr> +<td>11:35</td> +<td>11:50</td> +<td>Roi Lipman (Redis Labs)</td> +<td>Delta sparse matrices within RedisGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/roi-lipman-delta-matrix.pdf">slides</a>, <a href="https://youtu.be/qfKsplV4Ihk">video</a></td> +</tr> +<tr> +<td>11:55</td> +<td>12:05</td> +<td>Rathijit Sen (Microsoft)</td> +<td>Microarchitectural Analysis of Graph BI Queries on RDBMS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/rathijit-sen-microarchitectural-analysis.pdf">slides</a>, <a href="https://youtu.be/55B8CkH09js">video</a></td> +</tr> +<tr> +<td>12:10</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td><em>on your own</em></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Alastair Green (JCC)</td> +<td>LEX &ndash; LDBC Extended GQL Schema – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-lex.pdf">slides</a>, <a href="https://youtu.be/DVpeb4Ce9Uw">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Ora Lassila (AWS)</td> +<td>Why limit yourself to {RDF, LPG} when you can do {RDF, LPG}, 
too – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ora-lassila-why-limit-yourself-to-lpg-when-you-can-do-rdf-too.pdf">slides</a>, <a href="https://youtu.be/7uAInoUwdds">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Jan Hidders (Birkbeck, University of London)</td> +<td>PG-Schema: a proposal for a schema language for property graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/jan-hidders-pg-schema.pdf">slides</a>, <a href="https://youtu.be/yQNL8hBTE4M">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Max de Marzi (RageDB and RelationalAI)</td> +<td>RageDB: Building a Graph Database in Anger – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/max-de-marzi-ragedb-building-a-graph-database-in-anger.pdf">slides</a>, <a href="https://youtu.be/LBbF8aslYFE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Umit Catalyurek (AWS)</td> +<td>HPC Graph Analytics on the OneGraph Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/umit-catalyurek-onegraph-hpc.pdf">slides</a>, <a href="https://youtu.be/64tv5LA6Wr8">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>David J. Haglin (Trovares)</td> +<td>How LDBC impacts Trovares – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/david-haglin-trovares.pdf">slides</a>, <a href="">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>16:25</td> +<td>Wenyuan Yu (Alibaba Damo Academy)</td> +<td>GraphScope Flex: A Graph Computing Stack with LEGO-Like Modularity – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/wenyuan-yu-graphscope-flex.pdf">slides</a>, <a href="https://youtu.be/cRikoyDmMks">video</a></td> +</tr> +<tr> +<td>16:30</td> +<td>16:40</td> +<td>Scott McMillan (Carnegie Mellon University)</td> +<td>Graph processing using GraphBLAS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/scott-mcmillan-graph-processing-using-graphblas.pdf">slides</a>, <a href="https://youtu.be/yb4hGBhUzQQ">video</a></td> +</tr> +<tr> +<td>16:45</td> +<td>16:55</td> +<td>Tim Mattson (Intel)</td> +<td>Graphs (GraphBLAS) and storage (TileDB) as Sparse Linear algebra – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tim-mattson-graphblas-and-tiledb.pdf">slides</a></td> +</tr> +<tr> +<td>17:00</td> +<td>20:00</td> +<td><em>happy hour (rooftop grill with beverages)</em></td> +<td><em>on the Nitro South building&rsquo;s 8th floor deck</em></td> +</tr> +</tbody> +</table> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + LDBC SNB – Early 2023 updates + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + Wed, 15 Feb 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + <p>2023 has been an eventful year for us so far. 
Here is a summary of our recent activities.</p> +<ol> +<li> +<p>Our paper <a href="https://ldbcouncil.org/docs/papers/ldbc-snb-bi-vldb-2022.pdf">The LDBC Social Network Benchmark: Business Intelligence Workload</a> was published in PVLDB.</p> +</li> +<li> +<p>David Püroja just completed his MSc thesis on creating a design towards <a href="https://ldbcouncil.org/docs/papers/msc-thesis-david-puroja-snb-interactive-v2-2023.pdf">SNB Interactive v2</a> at CWI&rsquo;s Database Architectures group. David and I gave a deep-dive talk at the FOSDEM conference&rsquo;s graph developer room titled <a href="https://fosdem.org/2023/schedule/event/graph_ldbc/">The LDBC Social Network Benchmark</a> (<a href="https://www.youtube.com/watch?v=YNF6z6gtXY4">YouTube mirror</a>).</p> +</li> +<li> +<p>I gave a lightning talk at FOSDEM&rsquo;s HPC developer room titled <a href="https://www.youtube.com/watch?v=q26DHnQFw54">The LDBC Benchmark Suite</a> (<a href="https://www.youtube.com/watch?v=q26DHnQFw54">YouTube mirror</a>).</p> +</li> +<li> +<p>Our auditors have successfully benchmark a number of systems:</p> +<ul> +<li>SPB with the Ontotext GraphDB systems for the SF3 and SF5 data sets (auditor: Pjotr Scholtze)</li> +<li>SNB Interactive with the Ontotext GraphDB system for the SF30 data set (auditor: David Püroja)</li> +<li>SNB Interactive with the TuGraph system running in the Aliyun cloud for the SF30, SF100, and SF300 data sets (auditor: Márton Búr)</li> +</ul> +</li> +</ol> +<p>The results and the full disclosure reports are available under the <a href="https://ldbcouncil.org/benchmarks/spb/">SPB</a> and <a href="https://ldbcouncil.org/benchmarks/snb/">SNB benchmark pages</a>.</p> + + + + + LDBC SNB Datagen – The winding path to SF100K + https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/ + Tue, 13 Sep 2022 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/ + <p>LDBC SNB provides a data generator, which produces synthetic datasets, mimicking a social network’s activity during a period of time. Datagen is defined by the charasteristics of realism, scalability, determinism and usability. More than two years have elapsed since my <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">last technical update</a> on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the challenges I faced during the migration. Since then, we reached several goals such as we refactored the serializers to use Spark&rsquo;s high-level writers to support the popular Parquet data format and to enable running on spot nodes; brought back factor generation; implemented support for the novel BI benchmark; and optimized the runtime to generate SF30K on 20 i3.4xlarge machines on AWS.</p> +<h1 id="moving-to-sparksql">Moving to SparkSQL</h1> +<p>We planned to move parts of the code to SparkSQL, an optimized runtime framework for tabular data. We hypothesized that this would benefit us on multiple fronts: SparkSQL offers an efficient batch analytics runtime, with higher level abstractions that are simpler to understand and work with, and we could easily add support for serializing to Parquet based on SparkSQL&rsquo;s capabilites.</p> +<blockquote> +<p>Spark SQL is a Spark module for structured data processing. It provides a programming abstraction called DataFrames and can also act as a distributed SQL query engine. 
<p>Dealing with the dataset generator proved quite tricky, because it samples from various hand-written distributions and dictionaries and contains complex domain logic, for which SparkSQL is unsuitable. We assessed that the best thing we could do was to wrap entire entity generation procedures in UDFs (user-defined SQL functions). However, several of these generators return entity trees<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup>, which are spread across multiple tables by the serializer, and these would have needed to be split up. Further complicating matters, we would have also had to find a way to coordinate the inner random generators&rsquo; state between the UDFs to ensure deterministic execution. Weighing these obstacles against the modest benefit SparkSQL would bring to this part, we ultimately decided to leave entity generation as it is. We limited the SparkSQL refactor to the following areas:</p> +<ol> +<li>table manipulations related to shaping the output into the supported layouts and data types as set forth in the specification;</li> +<li>deriving the Interactive and BI datasets;</li> +<li>and generating the factor tables, which contain analytic information, such as population per country, number of friendships between city pairs, number of messages per day, etc., used by the substitution parameter generator to ensure predictable query runtimes.</li> +</ol> +<p>We refer to points (1) and (2) collectively as dataset transformation, and to (3) as factor generation. Initially, these had been part of the generator; extracting them as part of this refactor resulted in a cleaner, more maintainable design.</p> +<p><img src="datagen_df_0.png" alt="Datagen stages"></p> +<p>The diagram above shows the components on a high level. The generator outputs a dataset called the IR (intermediate representation), which is immediately written to disk. Then, the IR is input to the dataset transformation and factor generation stages, which respectively generate the final dataset and the factor tables. We are aware that writing out the IR adds considerable runtime overhead and doubles the disk requirements in the worst case; however, we found no simple way to avoid it, as the generator produces entity trees, which are incompatible with the flat, tabular, column-oriented layout of SparkSQL. On the positive side, this design enables us to reuse the generator output for multiple transformations and add new factor tables without regenerating the data.</p> +<p>I&rsquo;ll skip describing the social network graph dataset generator (i.e. stage 1) in any more detail, apart from its serializer, as that was the only part involved in the current refactor. 
If you are interested in more details, you may look up the <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">previous blogpost in the series</a> or the <a href="https://arxiv.org/abs/2001.02299">Interactive benchmark specification</a>.</p> +<h1 id="transformation-pipeline">Transformation pipeline</h1> +<p>The dataset transformation stage sets off where generation finished, and applies an array of pluggable transformations:</p> +<ul> +<li>explodes edges and / or attributes into separate tables,</li> +<li>subsets the snapshot part and creates insert / delete batches for the BI workload,</li> +<li>subsets the snapshot part for the Interactive workload,</li> +<li>applies formatting related options such as date time representation,</li> +<li>serializes the data to a Spark supported format (CSV, Parquet),</li> +</ul> +<p>We utilize a flexible data pipeline that operates on the graph.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span>, <span style="color:#66d9ef">M2</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">]</span> <span style="color:#a6e22e">extends</span> <span style="color:#f92672">(</span><span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">])</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">In</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> apply<span style="color:#f92672">(</span>v<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">])</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=</span> transform<span 
style="color:#f92672">(</span>v<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>The <code>Transform</code> trait encodes a pure (side effect-free) function polymorphic over graphs, so that transformation pipelines can be expressed with ordinary function composition in a type safe manner. Let&rsquo;s see some of the transformations we have.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToBiTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">BI</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> keepImplicitDeletes<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.BI</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span 
style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeEdges</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Therefore, a transformation pipeline may look like this:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>params<span style="color:#f92672">,</span> start<span style="color:#f92672">,</span> end<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span 
style="color:#66d9ef">val</span> outputGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>inputGraph<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>The <code>Graph</code> record has a <code>definition</code> field containing graph-global metadata, whereas <code>entities</code> holds the datasets keyed by their entity type. There are 3 graph <em>modes</em> currently: <code>Raw</code>, <code>Interactive</code> and <code>BI</code>. The BI dataset has different layout than the rest, as it contains incremental inserts and deletes for the entities additionally to the bulk snapshot. This is captured in the <code>Layout</code> dependent type, over which the entities are polymorphic.</p> +<p>It&rsquo;s important to understand that <code>Graph</code> holds <code>DataFrame</code>s, and these are lazily computed by Spark. So, <code>Graph</code> is merely a description of transformations used to derive the comprising datasets, which makes them subject to all the SparkSQL fanciness such as query optimization, whole stage code generation, and so on. Processing is delayed until an action (such as a disk write) forces it.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> isAttrExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> isEdgesExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> useTimestamp<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">M</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">Option</span><span style="color:#f92672">[</span><span style="color:#66d9ef">String</span><span style="color:#f92672">]]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> definition<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M</span><span style="color:#f92672">],</span> 
+</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">M</span><span style="color:#66d9ef">#</span><span style="color:#66d9ef">Layout</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">sealed</span> <span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Raw</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Interactive</span><span style="color:#f92672">(</span>bulkLoadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... 
*/</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">BI</span><span style="color:#f92672">(</span>bulkloadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">,</span> batchPeriod<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">String</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">BatchedEntity</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>You may notice that <code>Transform</code> is statically typed w.r.t. <code>Mode</code>, however other properties, like <code>isAttrExploded</code>, or <code>isEdgesExploded</code> are not captured in the type, and remain merely dynamic. This makes some nonsensical transformation pipelines (i.e. that explodes edges twice in a row) syntactically valid. This trade-off in compile-time safety was made to prevent overcomplicating the types.</p> +<p>As we already mentioned, <code>Graph</code> is essentially a persistent container of <code>EntityType -&gt; DataFrame</code> mappings. <code>EntityType</code> can be <code>Node</code>, <code>Edge</code> and <code>Attr</code>, and is used to identify the entity and embellish with static metadata, such a descriptive name and primary key, whether it is static or dynamic (as per the specification), and in case of edges, the source and destination type and cardinality. This makes it very simple to create transformation rules on static entity properties with pattern matching.</p> +<p>Usually, a graph transformation involves matching entities based on their <code>EntityType</code>, and modifying the mapping (and if required, other metadata). 
Take, for example, the <code>ExplodeAttrs</code> transformation, which explodes into separate tables the values of two columns of <code>Person</code> stored as arrays:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">if</span> <span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#75715e">// assert at runtime that the transformation hasn&#39;t been applied yet +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#66d9ef">throw</span> <span style="color:#66d9ef">new</span> <span style="color:#a6e22e">AssertionError</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Attributes already exploded in the input graph&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> explodedAttr<span style="color:#f92672">(</span>attr<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Attr</span><span style="color:#f92672">,</span> node<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">DataFrame</span><span style="color:#f92672">,</span> column<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Column</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">=</span> +</span></span><span style="display:flex;"><span> attr <span style="color:#f92672">-&gt;</span> node<span style="color:#f92672">.</span>select<span style="color:#f92672">(</span>withRawColumns<span style="color:#f92672">(</span>attr<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>parent<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">),</span> explode<span style="color:#f92672">(</span>split<span style="color:#f92672">(</span>column<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;;&#34;</span><span 
style="color:#f92672">)).</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>attribute<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">)))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> modifiedEntities <span style="color:#66d9ef">=</span> input<span style="color:#f92672">.</span>entities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>collect <span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k <span style="color:#66d9ef">@</span> <span style="color:#a6e22e">Node</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person&#34;</span><span style="color:#f92672">,</span> <span style="color:#66d9ef">false</span><span style="color:#f92672">),</span> df<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#75715e">// match the Person node. This is the only one ExplodeAttrs should modify +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#a6e22e">Map</span><span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Email&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;EmailAddress&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonEmailEmailAddress&#34; entity derived by exploding the email column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Speaks&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;Language&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonSpeaksLanguage&#34; entity derived by exploding the language column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> k <span style="color:#f92672">-&gt;</span> df<span style="color:#f92672">.</span>drop<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">)</span> <span style="color:#75715e">// drop the exploded columns from person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> 
updatedEntities <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>entities<span style="color:#f92672">)(</span><span style="color:#66d9ef">_</span> <span style="color:#f92672">++</span> <span style="color:#66d9ef">_</span><span style="color:#f92672">)</span> <span style="color:#75715e">// merge-replace the modified entities in the graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> updatedEntityDefinitions <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#f92672">(</span>e<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> e <span style="color:#f92672">++</span> v<span style="color:#f92672">.</span>map<span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> k <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Some</span><span style="color:#f92672">(</span>v<span style="color:#f92672">.</span>schema<span style="color:#f92672">.</span>toDDL<span style="color:#f92672">)</span> <span style="color:#f92672">}</span> <span style="color:#75715e">// update the entity definition schema to reflect the modifications +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> l <span style="color:#66d9ef">=</span> lens<span style="color:#f92672">[</span><span style="color:#66d9ef">In</span><span style="color:#f92672">]</span> <span style="color:#75715e">// lenses provide a terse syntax for modifying nested fields +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">(</span>l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>entities<span style="color:#f92672">).</span>set<span style="color:#f92672">(</span>input<span style="color:#f92672">)((</span><span style="color:#66d9ef">true</span><span style="color:#f92672">,</span> updatedEntityDefinitions<span style="color:#f92672">,</span> updatedEntities<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Note that <code>EntityType</code> does not hold the dataset&rsquo;s full SQL schema currently, as it&rsquo;s not useful for pattern matching, but can be accessed 
directly from <code>DataFrame</code> if needed.</p> +<h1 id="inputoutput">Input/output</h1> +<p>The <code>Reader</code> and <code>Writer</code> typeclasses are used to read from a <code>Source</code> and write to a <code>Sink</code> respectively, terminating a graph transformation pipeline<br> +on both ends.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">T</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> read<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> exists<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">S</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Data</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> write<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Data</span><span style="color:#f92672">,</span> sink<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">S</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Unit</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>There are implementations under <code>ldbc.datagen.io.instances</code> that read a graph from a <code>GraphSource</code> and write to a <code>GraphSink</code>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span 
style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> source <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSource</span>, <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>read<span style="color:#f92672">(</span>source<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span><span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>graph<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// write +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> sink <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSink</span>, <span 
style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>write<span style="color:#f92672">(</span>transformedGraph<span style="color:#f92672">,</span> sink<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>We provide <a href="https://github.com/typelevel/simulacrum">Ops syntax</a> to make it shorter:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Reader.ops._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Writer.ops._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">).</span>read +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> <span style="color:#f92672">???</span> <span style="color:#75715e">/* ... 
*/</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// write +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span> +</span></span><span style="display:flex;"><span>transformedGraph<span style="color:#f92672">.</span>write<span style="color:#f92672">(</span><span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">))</span> +</span></span></code></pre></div><p>The reader/writer architecture is layered: the graph reader/writer uses dataframe readers/writers for each of its entities. One interesting aspect of implementing the reader was dealing with the input schema. Parquet is self-describing; however, as we also support the CSV format, we had to provide a way for correct schema detection and column parsing.</p> +<p>Spark has a facility to derive a SparkSQL schema from case classes automatically<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup>. We created case classes for each entity in the <code>Raw</code> dataset. We also created a typeclass <code>EntityTraits</code> associating these classes with their <code>EntityType</code>, so we can summon them (and consequently their SparkSQL schema) in the reader.</p> +<p>The case classes are used during the serialization of the generated dataset too, but more about that later.</p> +<h1 id="factor-generation">Factor generation</h1> +<p>As we already mentioned, factor generation was originally part of the data generator, i.e. factor tables were calculated on the fly and emitted as side outputs. This design had some problems. Auxiliary data structures had to be maintained and interleaved with generation, which violated separation of concerns, consequently hurting readability and maintainability. Also, anything more complicated than entity-local aggregates was impossible to express in the original MapReduce framework. To keep the preceding Spark rewrite at a manageable scope, the original factor generation code had been removed.</p> +<p>We decided it was best to reintroduce factor generation as a post-processing step that operates on the generated data. This makes it possible to express more complex analytical queries, requires no prior knowledge about the generator, can be done in SparkSQL (making it much simpler), and removes the impact on the generator&rsquo;s performance, so that the two can be optimized separately. Since this refactor, we have almost tripled the number of factor tables (up to 31, covering both SNB workloads, BI and Interactive). The queries computing certain factor tables even use <a href="https://spark.apache.org/graphx/">GraphX</a>, which was unimaginable with the previous design.</p> +<p>Factor tables are added by extending a map with a <code>name -&gt; Factor</code> pair. 
<code>Factor</code> declares is input entities, and accepts a function that receives input <code>DataFrames</code>, and returns a single <code>DataFrame</code> as output.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> factors <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Map</span> <span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;personDisjointEmployerPairs&#34;</span> <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Factor</span><span style="color:#f92672">(</span><span style="color:#a6e22e">PersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonKnowsPersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">OrganisationType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonWorkAtCompanyType</span><span style="color:#f92672">)</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">case</span> <span style="color:#a6e22e">Seq</span><span style="color:#f92672">(</span>person<span style="color:#f92672">,</span> personKnowsPerson<span style="color:#f92672">,</span> organisation<span style="color:#f92672">,</span> workAt<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> knows <span style="color:#66d9ef">=</span> undirectedKnows<span style="color:#f92672">(</span>personKnowsPerson<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> company <span style="color:#66d9ef">=</span> organisation<span style="color:#f92672">.</span>where<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;Type&#34;</span> <span style="color:#f92672">===</span> <span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">).</span>cache<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> personSample <span style="color:#66d9ef">=</span> person +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>orderBy<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>limit<span style="color:#f92672">(</span><span style="color:#ae81ff">20</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> personSample +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person2&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>knows<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;knows&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;knows.person2Id&#34;</span> <span style="color:#f92672">===</span> $<span 
style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>workAt<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;workAt&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;workAt.PersonId&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;knows.Person1id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>company<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;Company.id&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;workAt.CompanyId&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>select<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2id&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.name&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyName&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyId&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.creationDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2creationDate&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.deletionDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2deletionDate&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>distinct<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">},</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* more factors */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span></code></pre></div><p>As you can see, it&rsquo;s not much complicated than using plain SQL, with the added benefit of being able to extract recurring subqueries to functions (e.g. <code>undirectedKnows</code>). Currently, there&rsquo;s no parallelization between different factor tables (although each of them is parallelized internally by Spark). 
The Factor table writer uses the same componentized architecture as the graph writer, i.e. it uses the dataframe writer under the hood.</p> +<h1 id="revamping-the-data-generators-serializer">Revamping the data generator&rsquo;s serializer</h1> +<p>At this point, both the transformation pipeline and the factor generator were ready; however, the data generator was still chugging along with the old serializer, emitting the IR in CSV. We wanted to move this to Parquet to improve performance and reduce its size, but there was a problem: due to the generator&rsquo;s custom data representation, SparkSQL (and its DataSource API) was off-limits. So we bit the bullet and rewrote the existing serializer to emit Parquet.</p> +<blockquote> +<p><a href="https://parquet.apache.org/">Parquet</a> is an open source data format that evolved to be the de facto standard for Big Data batch pipelines. It offers a column-oriented, compressed, schemaful representation that is space-efficient and suited for analytic queries. The file format leverages a record shredding and assembly model, which originated at Google. This results in a file that is optimized for query performance and minimizing I/O.</p> +</blockquote> +<p>The new serialization framework is heavily influenced by the design of Java <code>OutputStreams</code>, in the sense that stateful objects are composed to form a pipeline. For example, in the case of <em>activities</em>, the input is an activity tree, and the output is a set of rows in multiple files (e.g. forum, forumHasTag, post, postHasTag, etc.). The components that take part in activity serialization are shown in the diagram below. The activity tree is iterated over (first component) and the corresponding entity serializer is called (second component), which feeds a component that splits the records (third component) among several output streams writing individual files (last component).</p> +<p><img src="activity.png" alt="Activity serialization pipeline"></p> +<p>The benefit of this architecture is that only the last component needs to change when we add support for a new output format.</p>
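<p>A rough sketch of this composition style (hypothetical; the class names are made up and heavily simplified, not the actual Datagen components) could look as follows, with only the format-specific sink changing per output format:</p>
<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">// Hypothetical sketch of the OutputStream-like composition (illustrative names only).
// Stateful components are chained; only the last one knows the concrete file format.
trait RecordSink[T] {
  def write(record: T): Unit
  def close(): Unit
}

// Format-specific sink: the only component that changes when adding a new output format.
class CsvFileSink(path: String) extends RecordSink[Seq[String]] {
  private val writer = new java.io.PrintWriter(path)
  def write(record: Seq[String]): Unit = writer.println(record.mkString(&#34;|&#34;))
  def close(): Unit = writer.close()
}

// Splitter: routes the rows produced from one activity tree to per-entity sinks
// (forum, forumHasTag, post, postHasTag, ...).
class EntitySplitter(sinks: Map[String, RecordSink[Seq[String]]]) {
  def write(entity: String, row: Seq[String]): Unit = sinks(entity).write(row)
  def close(): Unit = sinks.values.foreach(_.close())
}
</code></pre></div>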
<p>To support Parquet, we made use of row-level serializers available in Hadoop&rsquo;s Parquet library (bundled with SparkSQL), and internal classes in SparkSQL to derive the Parquet schema for our entities. Remember how we used case classes for the <code>Raw</code> entities to derive the input schema in the graph reader during dataset transformation? Here we use the same classes (e.g. <code>Forum</code>) and Spark&rsquo;s <code>Encoder</code> framework to encode the entities in Parquet, which means that the generated output remains consistent with the <code>DataFrame</code>-based reader, and we avoid a lot of code duplication.</p> +<h1 id="optimizations">Optimizations</h1> +<p>After these refactors, we were able to generate the BI dataset with scale factor 10K on 300 i3.4xlarge machines in one hour. Decreasing the number of machines resulted in out-of-memory errors in the generator. We realized that partition sizes (and thus the number of partitions) should be determined based on the available memory. Our experiments showed that a machine with 128 GB of memory is capable of generating SF3K (scale factor 3000) reliably with 3 blocks<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> per partition, given ample disk space to allow for spills (tested with 3.8 TB); fewer partitions (and consequently a larger block/partition ratio) would introduce OOM errors. Furthermore, we split the data generator output after a certain number of rows have been written, to guard against the skew between different kinds of entities causing problems during transformation<sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup>. These optimizations enabled us to run SF10K reliably on 4 i3.4xlarge machines in 11 hours (which is still a more than 6x reduction in cost). We were not able to run SF30K on 10 machines (1 machine per SF3K); even 15 ran out of disk. This non-linear disk use should be investigated further, as it complicates calculating cluster sizes for larger scale factors.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf3k_bi <span style="color:#ae81ff">3000</span> parquet bi <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">330</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs +</span></span></code></pre></div><div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf10k_bi <span style="color:#ae81ff">10000</span> parquet bi <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">1000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs +</span></span></code></pre></div><p>The above examples are working configurations for generating the SF3K and SF10K BI datasets. The <code>--sf-per-executor</code> option controls the number of worker nodes allocated, in this case one node per 3000 SF, i.e. 1 and 4 nodes, respectively. The <code>--partitions</code> option controls the total number of partitions, and was calculated based on the number of persons using the formula <code>partitions = ceil(number_of_persons / block_size / 3)</code> to get a maximum of 3 blocks per partition.</p>
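<p>For reference, a small helper capturing this formula (hypothetical, not part of the tooling; the person count below is purely illustrative) shows how the <code>--partitions</code> values above can be derived:</p>
<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">// Hypothetical helper mirroring the formula above:
// partitions = ceil(number_of_persons / block_size / blocks_per_partition).
// The generator emits blocks of 10,000 persons (see footnote 3); 3 blocks per partition
// is the memory-safe maximum we observed on a 128 GB machine.
def partitionsFor(numberOfPersons: Long,
                  blockSize: Long = 10000L,
                  blocksPerPartition: Long = 3L): Long =
  math.ceil(numberOfPersons.toDouble / blockSize / blocksPerPartition).toLong

// Illustrative only: about 9.9 million persons would yield the 330 partitions used above.
partitionsFor(9900000L) // = 330
</code></pre></div>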
The <code>--partitions</code> option controls the total number of partitions, and was calculated based on the number of persons using the formula <code>partitions = ceil(number_of_persons / block_size / 3)</code> to get a maximum of 3 blocks per partition.</p>
+<h1 id="conclusion">Conclusion</h1>
+<p>These improvements made LDBC SNB Datagen more modular, maintainable and efficient, costing under a cent per scale factor to generate the BI dataset, which enables us to generate datasets beyond SF 100K.</p>
+<h1 id="footnotes">Footnotes</h1>
+<div class="footnotes" role="doc-endnotes">
+<hr>
+<ol>
+<li id="fn:1">
+<p>The generator produces hierarchies, such as a forum wall with a random number of posts, which in turn have comments, etc. This tree is iterated, and the different entities are written to separate files.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:2">
+<p>Shameless plug: You can learn more about this in <a href="https://www.dataversity.net/case-study-deriving-spark-encoders-and-schemas-using-implicits/">another blogpost of mine</a>.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:3">
+<p>The data generator produces blocks of 10,000 persons and their related entities. Entities from different blocks are unrelated (isolated).&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:4">
+<p>The maximum row count per file is currently 10M; this can be modified with a command-line option. We also had an alternative design in mind where this number would have been determined based on the average row size of each entity; however, we stayed with the first version for simplicity.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+</ol>
+</div>
+
+
+
+
+      Fifteenth TUC Meeting
+      https://ldbcouncil.org/event/fifteenth-tuc-meeting/
+      Fri, 17 Jun 2022 09:20:00 -0500
+
+      https://ldbcouncil.org/event/fifteenth-tuc-meeting/
+      <p><strong>Organizers:</strong> Gábor Szárnyas, Jack Waudby, Peter Boncz, Alastair Green</p>
+<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2022.sigmod.org/venue.shtml">SIGMOD 2022</a> on <strong>June 17-18 (Friday-Saturday)</strong>.</p>
+<p>The program consists of 10-15 minute talks followed by a Q&amp;A session. The talks will be recorded and made available online.<br>
+The tentative program is the following.
<strong>All times are in EDT.</strong></p> +<p>We will have a social event on Friday at 17:30 at <a href="https://elvezrestaurant.com/">El Vez</a> (<a href="https://g.page/ElVezPhilly">Google Maps</a>).</p> +<h4 id="friday-pennsylvania-convention-centerhttpswwwpaconventioncom-room-204bhttps2022sigmodorgprogramshtml">Friday (<a href="https://www.paconvention.com/">Pennsylvania Convention Center</a>, <a href="https://2022.sigmod.org/program.shtml">room 204B</a>)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:20</td> +<td>09:30</td> +<td>Peter Boncz (LDBC/CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/39BoOIGk9Is">video</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Alastair Green (LDBC/Birkbeck)</td> +<td>LDBC&rsquo;s fair use policies – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-fair-use-of-the-ldbc-trademark.pdf">slides</a>, <a href="https://youtu.be/7zmCysN4Rpg">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Gábor Szárnyas (LDBC/CWI), Jack Waudby (Newcastle University)</td> +<td>LDBC Social Network Benchmark: Business Intelligence workload v1.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/gabor-szarnyas-the-ldbc-social-network-benchmark-business-intelligence-workload.pdf">slides</a>, <a href="https://youtu.be/AJ96M8_njxE">video</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Heng Lin (Ant Group)</td> +<td>LDBC Financial Benchmark introduction – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/heng-lin-ldbc-financial-benchmark-introduction.pdf">slides</a>, <a href="https://youtu.be/iBhud_YjafY">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Chen Zhang (CreateLink)</td> +<td>New LDBC SNB benchmark record by Galaxybase: More than 6 times faster and 70% higher throughput – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/chen-zhang-new-ldbc-snb-benchmark-record-by-galaxybase-more-than-6-times-faster-and-70-percent-higher-throughput.pdf">slides</a>, <a href="https://youtu.be/sMzTsb8iw_Y">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>James Clarkson (Neo4j)</td> +<td>LDBC benchmarks: Promoting good science and industrial consumption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/james-clarkson-ldbc-benchmarks-promoting-good-science-and-industrial-consumption.pdf">slides</a>, <a href="https://youtu.be/VYG1mzcl9qQ">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Oskar van Rest (Oracle)</td> +<td>Creating and querying property graphs in Oracle, on-premise and in the cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oskar-van-rest-creating-and-querying-property-graphs-in-oracle-on-premise-and-in-the-cloud.pdf">slides</a>, <a href="https://youtu.be/2HX2Vixf2gs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:15</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>Conquering LDBC SNB BI at SF-10k – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/mingxi-wu-conquering-ldbc-snb-bi-at-sf10k.pdf">slides</a>, <a href="https://youtu.be/oJbqzQ_t3G8">video</a></td> +</tr> +<tr> +<td>12:20</td> +<td>13:20</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:20</td> +<td>13:35</td> +<td>Altan Birler (Technische Universität München)</td> +<td>Relational databases can handle graphs too! Experiences with optimizing the Umbra RDBMS for LDBC SNB BI – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/altan-birler-relational-databases-can-handle-graphs-too.pdf">slides</a>, <a href="https://youtu.be/cRgbdY3I2i4">video</a></td> +</tr> +<tr> +<td>13:40</td> +<td>13:55</td> +<td>David Püroja (CWI)</td> +<td>LDBC Social Network Benchmark: Interactive workload v2.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/david-puroja-ldbc-snb-interactive-workload-v2.0.pdf">slides</a></td> +</tr> +<tr> +<td>14:00</td> +<td>14:15</td> +<td>Angela Bonifati (Lyon 1 University)</td> +<td>The quest for schemas in graph databases – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/angela-bonifati-the-quest-for-schemas-in-graph-databases.pdf">slides</a>, <a href="https://youtu.be/VT7cx3Jp7V8">video</a></td> +</tr> +<tr> +<td>14:20</td> +<td>14:35</td> +<td>Matteo Lissandrini (Aalborg University)</td> +<td>Understanding graph data representations in triplestores – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/matteo-lissandrini-understanding-graph-data-representations-in-triplestores.pdf">slides</a>, <a href="https://youtu.be/xqVMJZfh_JU">video</a></td> +</tr> +<tr> +<td>14:40</td> +<td>14:55</td> +<td>Wim Martens (University of Bayreuth)</td> +<td>Path representations – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/wim-martens-path-representations.pdf">slides</a>, <a href="https://youtu.be/Ma-E5dwgf-E">video</a></td> +</tr> +<tr> +<td>15:00</td> +<td>15:20</td> +<td>Audrey Cheng (UC Berkeley)</td> +<td>TAOBench: An end-to-end benchmark for social network workloads – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/audrey-cheng-taobench.pdf">slides</a>, <a href="https://youtu.be/1p8AStxS3es">video</a></td> +</tr> +</tbody> +</table> +<h4 id="saturday-philadelphia-marriott-downtownhttpswwwmarriottcomen-ushotelsphldt-philadelphia-marriott-downtown-room-401-402-4th-floor">Saturday (<a href="https://www.marriott.com/en-us/hotels/phldt-philadelphia-marriott-downtown/">Philadelphia Marriott Downtown</a>, room 401-402, 4th floor)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Keith Hare (WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/keith-hare-property-graph-standards-process-and-timing.pdf">slides</a>, <a href="https://youtu.be/xFVD3LWnKlc">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>10:35</td> +<td>Leonid Libkin (ENS Paris)</td> +<td>Pattern matching in GQL and SQL/PGQ – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/leonid-libkin-pattern-matching-in-gql-and-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/OvGsa0qLANE">video</a></td> +</tr> +<tr> +<td>10:40</td> +<td>10:55</td> +<td>Petra Selmer (Neo4j/WG3)</td> +<td>An overview of GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/petra-selmer-towards-gql-v1-a-property-graph-query-language-standard.pdf">slides</a>, <a href="https://youtu.be/tncf2FgyIyo">video</a></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (LDBC/WG3)</td> +<td>GQL 2.0: A technical manifesto – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-gql-2.0-a-technical-manifesto.pdf">slides</a>, <a href="https://youtu.be/upIvpYy8C2g">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>George Fletcher (TU Eindhoven)</td> +<td>PG-Keys (LDBC Property Graph Schema Working Group) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/george-fletcher-pg-keys-keys-for-property-graphs.pdf">slides</a>, <a href="https://youtu.be/_W8-jOtcObc">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Arvind Shyamsundar (Microsoft)</td> +<td>Graph capabilities in Microsoft SQL Server and Azure SQL Database – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/arvind-shyamsundar-graph-capabilities-in-microsoft-sql-server-and-azure-database.pdf">slides</a>, <a href="https://youtu.be/xxV2BfZupGw">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>13:30</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Daniël ten Wolde (CWI)</td> +<td>Implementing SQL/PGQ in DuckDB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/daniel-ten-wolde-implementing-sql-pgq-in-duckdb.pdf">slides</a>, <a href="https://youtu.be/JmSfU0BTH5w">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Oszkár Semeráth, Kristóf Marussy (TU Budapest)</td> +<td>Generation techniques for consistent, realistic, diverse, and scalable graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oszkar-semerath-generation-techniques-for-consistent-realistic-diverse-and-scalable-graphs.pdf">slides</a>, <a href="https://youtu.be/hB6j6mvh-vA">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Molham Aref (RelationalAI)</td> +<td>Graph Normal Form – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/molham-aref-graph-normal-form.pdf">slides</a>, <a href="https://youtu.be/-kP4Raqr5KA">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Naomi Arnold (Queen Mary University of London)</td> +<td>Temporal graph analysis of the far-right social network Gab – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/naomi-arnold-temporal-graph-analysis-of-the-far-right-social-network-gab.pdf">slides</a>, <a href="https://youtu.be/ugSkFlif4PE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:05</td> +<td>Domagoj Vrgoč (PUC Chile)</td> +<td>Evaluating path queries in MillenniumDB – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/domagoj-vrgoc-regular-path-queries-in-millenniumdb.pdf">slides</a>, <a href="https://youtu.be/_OzJ6vI7GNU">video</a></td> +</tr> +<tr> +<td>15:10</td> +<td>15:25</td> +<td>Pavel Klinov, Evren Sirin (Stardog)</td> +<td>Stardog&rsquo;s experience with LDBC – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/evren-sirin-stardog-experience-with-ldbc.pdf">slides</a>, <a href="https://youtu.be/CBrEeOTqGKM">video</a></td> +</tr> +</tbody> +</table> + + + + + Announcing the LDBC Financial Benchmark Task Force + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + Thu, 26 May 2022 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + <p>We are delighted to announce the set up of the <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench) task force</a>.</p> +<p>The Financial Benchmark (FinBench) project aims to define a graph database evaluating benchmark and develop a data generation process and a query driver to make the evaluation of the graph database representative, reliable and comparable, especially in financial scenarios, such as anti-fraud and risk control. The FinBench is scheduled to be released in the end of 2022.</p> +<p>Compared to LDBC SNB, the FinBench will differ in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. FinBench is going to redesign the data pattern and workloads, including the data generation, the query driver, and also some other facilities referred to LDBC SNB.</p> +<p>The FinBench Task Force was approved by LDBC on May 16, 2022. The FinBench Task Force is led by Ant Group, and the initial members also include Pometry, Create Link, StarGraph, Ultipa, Katana, Intel, Memgraph (observer) and Koji Annoura (individual member). See the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">Work Charter for FinBench</a></p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or guozhihui.gzh at antgroup.com.</p> + + + + + Fourteenth TUC Meeting + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + Mon, 16 Aug 2021 16:00:00 +0200 + + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + <p>LDBC was hosting a one-day hybrid workshop, co-located with <a href="https://vldb.org/2021/">VLDB 2021</a> on <strong>August 16 (Monday) between 16:00–20:00 CEST</strong>.</p> +<p>The physical part of the workshop was held in room Akvariet 2 of the <a href="https://www.tivolihotel.com/">Tivoli Hotel</a> (Copenhagen), while the virtual part was hosted on Zoom. Our programme consisted of talks that provide an overview of LDBC&rsquo;s recent efforts. Moreover, we have invited industry practitioners and academic researchers to present their latest results.</p> +<p>Talks were scheduled to be 10 minutes with a short Q&amp;A session. We had three sessions. 
Their schedules are shown below.</p> +<h4 id="16001725-cest-ldbc-updates-benchmarks-query-languages">[16:00–17:25 CEST] LDBC updates, benchmarks, query languages</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>16:00</td> +<td>Peter Boncz (CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a></td> +</tr> +<tr> +<td>16:05</td> +<td>Gábor Szárnyas (CWI)</td> +<td>Overview of LDBC benchmarks – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-benchmarks.pdf">slides</a></td> +</tr> +<tr> +<td>16:12</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>LDBC Social Network Benchmark results with TigerGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mingxi-wu-tigergraph-snb-preliminary-results.pdf">slides</a></td> +</tr> +<tr> +<td>16:24</td> +<td>Xiaowei Zhu (Ant Group)</td> +<td>Financial Benchmark proposal – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/xiaowei-zhu-financial-benchmark.pdf">slides</a></td> +</tr> +<tr> +<td>16:36</td> +<td>Petra Selmer (Neo4j)</td> +<td>Status report from the Existing Languages Working Group (ELWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/petra-selmer-elwg.pdf">slides</a>, <a href="https://youtu.be/I5A8VuFDhsA">video</a></td> +</tr> +<tr> +<td>16:48</td> +<td>Jan Hidders (Birkbeck)</td> +<td>Status report from the Property Graph Schema Working Group (PGSWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/jan-hidders-pgswg.pdf">slides</a>, <a href="https://youtu.be/iEbVi9T-HVk">video</a></td> +</tr> +<tr> +<td>17:00</td> +<td>Keith Hare (JCC Consulting)</td> +<td>Database Language Standards Structure and Process, SQL/PGQ – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/keith-hare-database-language-standards-structure-and-process-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/ZgFCuzods4g">video</a></td> +</tr> +<tr> +<td>17:12</td> +<td>Stefan Plantikow (GQL Editor)</td> +<td>Report on the GQL standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/stefan-plantikow-gql.pdf">slides</a>, <a href="https://youtu.be/z0pN5NwKsgc">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="17351845-cest-systems-and-data-structures">[17:35–18:45 CEST] Systems and data structures</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>17:35</td> +<td>Vasileios Trigonakis (Oracle Labs)</td> +<td>PGX.D aDFS: An Almost Depth-First-Search Distributed Graph-Querying System – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasileios-trigonakis-pgxd-adfs.pdf">slides</a>, <a href="https://youtu.be/cv2ZfWRBOek">video</a></td> +</tr> +<tr> +<td>17:47</td> +<td>Matthias Hauck (SAP)</td> +<td>JSON, Spatial, Graph – Multi-model Workloads with SAP HANA Cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/matthias-hauck-json-spatial-graph-sap-hana-cloud.pdf">slides</a>, <a 
href="https://youtu.be/dgpMJFho6Q8">video</a></td> +</tr> +<tr> +<td>17:59</td> +<td>Nikolay Yakovets (Eindhoven University of Technology)</td> +<td>AvantGraph – <a href="https://youtu.be/z0pN5NwKsgcttachments/nikolay-yakovets-avantgraph.pdf">slides</a>, <a href="https://youtu.be/9M9FOycovTw">video</a></td> +</tr> +<tr> +<td>18:11</td> +<td>Semih Salihoglu (University of Waterloo)</td> +<td>GRainDB: Making RDBMSs Efficient on Graph Workloads Through Predefined Joins – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semih-salihoglu-graindb.pdf">slides</a>, <a href="https://youtu.be/FFK3y6vPHJs">video</a></td> +</tr> +<tr> +<td>18:23</td> +<td>Semyon Grigorev (Saint Petersburg University)</td> +<td>Context-free path querying: Obstacles on the way to adoption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semyon-grigorev-cfpq.pdf">slides</a>, <a href="https://youtu.be/pha1xIpEL3I">video</a></td> +</tr> +<tr> +<td>18:35</td> +<td>Per Fuchs (Technical University of Munich)</td> +<td>Sortledton: A universal, transactional graph data structure – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/per-fuchs-sortledton.pdf">slides</a>, <a href="https://youtu.be/33ZjsNN0hhU">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="1855-2000-cest-high-level-approaches-and-benchmarks">[18:55-20:00 CEST] High-level approaches and benchmarks</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>18:55</td> +<td>Angelos-Christos Anadiotis (Ecole Polytechnique and Institut Polytechnique de Paris)</td> +<td>Empowering Investigative Journalism with Graph-based Heterogeneous Data Management – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/angelos-christos-anadiotis-investigative-journalism-graph-data-management.pdf">slides</a>, <a href="https://youtu.be/a1VYjyec8dg">video</a></td> +</tr> +<tr> +<td>19:07</td> +<td>Vasia Kalavri (Boston University)</td> +<td>Learning to partition unbounded graph streams – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasia-kalavri-learning-to-partition-unbounded-graph-streams.pdf">slides</a>, <a href="https://youtu.be/PTlUABKWniA">video</a></td> +</tr> +<tr> +<td>19:19</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Towards a Hybrid OLTP-OLAP Graph Benchmark – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/muhammad-attahir-jibril-hybrid-oltp-olap-benchmark.pdf">slides</a>, <a href="https://youtu.be/tMBVszTSJXc">video</a></td> +</tr> +<tr> +<td>19:31</td> +<td>Riccardo Tommasini (University of Tartu)</td> +<td>An outlook on Benchmarks for Graph Stream Processing – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/riccardo-tommasini-graph-stream-processing-benchmarks.pdf">slides</a>, <a href="https://youtu.be/HabvJvPXsLc">video</a></td> +</tr> +<tr> +<td>19:43</td> +<td>Mohamed Ragab (University of Tartu)</td> +<td>Benchranking: Towards prescriptive analysis of big graph processing: the case of SparkSQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mohamed-ragab-benchranking.pdf">slides</a>, <a href="https://youtu.be/mZ8LhGUq7Wg">video</a></td> 
+</tr> +</tbody> +</table> + + + + + Thirteenth TUC Meeting + https://ldbcouncil.org/event/thirteenth-tuc-meeting/ + Tue, 30 Jun 2020 14:00:00 +0000 + + https://ldbcouncil.org/event/thirteenth-tuc-meeting/ + <p>LDBC is pleased to announce its Thirteenth Technical User Community (TUC) meeting.</p> +<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p> +<p>This TUC meeting will be a two-day event hosted online. We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Gabor Szarnyas (BME) to register.</p> +<h3 id="snb-task-force">SNB Task Force</h3> +<ul> +<li>Progress report +<ul> +<li>ACID compliance test suite</li> +<li>Integrating deletions to Datagen</li> +<li>Migrating Datagen to Spark</li> +<li>Redesign of BI read queries</li> +<li>Extensions to the driver</li> +</ul> +</li> +<li>Ongoing work +<ul> +<li>Datagen: tuning the distribution of deletes</li> +<li>Interactive 2.0 workload</li> +<li>BI 1.0 workload</li> +</ul> +</li> +</ul> +<p>Zoom links will be sent through email.</p> + + + + + Speeding Up LDBC SNB Datagen + https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/ + Fri, 12 Jun 2020 00:00:00 +0000 + + https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/ + <p>LDBC&rsquo;s <a href="#references">Social Network Benchmark [4]</a> (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework where different graph-based technologies can be fairly tested and compared, that can drive the identification of systems&rsquo; bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data management.</p> +<p>LDBC SNB provides <a href="https://github.com/ldbc/ldbc_snb_datagen">Datagen</a> (Data Generator), which produces synthetic datasets, mimicking a social network&rsquo;s activity during a period of time. Datagen is defined by the charasteristics of realism, scalability, determinism and usability. To address scalability in particular, Datagen has been implemented on the MapReduce computation model to enable scaling out across a distributed cluster. However, since its inception in the early 2010s there has been a tremendous amount of development in the big data landscape, both in the sophistication of distributed processing platforms, as well as public cloud IaaS offerings. In the light of this, we should reevaluate this implementation, and in particular, investigate if Apache Spark would be a more cost-effective solution for generating datasets on the scale of tens of terabytes, on public clouds such as Amazon Web Services (AWS).</p> +<h2 id="overview">Overview</h2> +<p>The benchmark&rsquo;s specification describes a social network <a href="https://github.com/ldbc/ldbc_snb_docs/blob/9253abbde94ec7eaccd366c5d4c15cca30752e36/figures/schema-comfortable.pdf">data model</a> which divides its components into two broad categories: static and dynamic. The dynamic element consists of an evolving network where people make friends, post in forums, comment or like each others posts, etc. 
In contrast, the static component contains related attributes, such as countries, universities and organizations, whose values are fixed. For the detailed specifications of the benchmark and the Datagen component, see <a href="#references">References</a>.</p>
+<p>Datasets are generated in a multi-stage process captured as a sequence of MapReduce steps (shown in the diagram below).</p>
+<p><img src="datagen_flow.png" alt=""> \ <em>Figure 1. LDBC SNB Datagen Process on Hadoop</em></p>
+<p>In the initialization phase, dictionaries are populated and distributions are initialized. In the first generation phase, persons are synthesized, then relationships are wired between them along 3 dimensions (university, interest and random). After merging the graph of person relationships, the resulting dataset is output. Following this, activities such as forum posts, comments, likes and photos are generated and output. Finally, the static components are output.</p>
+<p><em>Note: The diagram shows the call sequence as implemented. All steps are sequential &ndash; including the relationship generation &ndash; even in cases when the data dependencies would allow for parallelization.</em></p>
+<p>Entities are generated by procedural Java code and are represented as POJOs in memory and as sequence files on disk. Most entities follow a shallow representation, i.e. foreign keys (in relational terms) are mapped to integer ids, which makes serialization straightforward.<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup> A notable exception is the Knows edge, which contains only the target vertex and is used as a navigation property on the source Person. The target Person is replaced with only the foreign key, augmented with some additional information in order to keep the structure free of cycles. Needless to say, this <em>edge as property</em> representation makes the data harder to handle in SQL than it would be with a flat join table.</p>
+<p>Entity generation amounts to roughly one fifth of the main codebase. It generates properties drawn from several random distributions using mutable pRNGs. Determinism is achieved by initializing the pRNGs with seeds that are fully defined by the configuration and constants, and by otherwise having no external state in the logic.<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup></p>
+<p>Serialization is done by hand-written serializers for the supported output formats (e.g. CSV) and comprises just a bit less than one third of the main codebase. Most of the output is created by directly interacting with low-level HDFS file streams. Ideally, this code should be migrated to higher-level writers that handle faults and give consistent results when the task has to be restarted.</p>
+<h2 id="motivations-for-the-migration">Motivations for the migration</h2>
+<p>The application is written using Hadoop MapReduce, which is now largely superseded by more modern distributed batch processing platforms, notably Apache Spark. For this reason, it was proposed to migrate Datagen to Spark. The migration provides the following benefits:</p>
+<ul>
+<li>
+<p><strong>Better memory utilization:</strong> MapReduce is disk-oriented, i.e. it writes the output to disk after each reduce stage, which is then read by the next MapReduce job. As public clouds provide virtual machines with sufficient RAM to encapsulate any generated dataset, time and money are wasted by the overhead this unnecessary disk I/O incurs.
Instead, the intermediate results should be cached in memory where possible. The lack of support for this is a well-known limitation of MapReduce.</p> +</li> +<li> +<p><strong>Smaller codebase:</strong> The Hadoop MapReduce library is fairly ceremonial and boilerplatey. Spark provides a higher-level abstraction that is simpler to work with, while still providing enough control on the lower-level details required for this workload.</p> +</li> +<li> +<p><strong>Small entry cost:</strong> Spark and MapReduce are very close conceptually, they both utilise HDFS under the hood, and run on the JVM. This means that a large chunk of the existing code can be reused, and migration to Spark can, therefore, be completed with relatively small effort. Additionally, MapReduce and Spark jobs can be run on AWS EMR using basically the same HW/SW configuration, which facilitates straightforward performance comparisons.</p> +</li> +<li> +<p><strong>Incremental improvements:</strong> Spark exposes multiple APIs for different workloads and operating on different levels of abstraction. Datagen may initially utilise the lower-level, Java-oriented RDDs (which offer the clearest 1 to 1 mapping when coming from MapReduce) and gradually move towards DataFrames to support Parquet output in the serializers and maybe unlock some SQL optimization capabilities in the generators later down the road.</p> +</li> +<li> +<p><strong>OSS, commodity:</strong> Spark is one of the most widely used open-source big data platforms. Every major public cloud provides a managed offering for Spark. Together these mean that the migration increases the approachability and portability of the code.</p> +</li> +</ul> +<h2 id="first-steps">First steps</h2> +<p>The first milestone is a successful run of LDBC Datagen on Spark while making the minimum necessary amount of code alterations. This entails the migration of the Hadoop wrappers around the generators and serializers. The following bullet-points summarize the key notions that cropped up during the process.</p> +<ul> +<li> +<p><strong>Use your memory:</strong> A strong focus was placed on keeping the call sequence intact, so that the migrated code evaluates the same steps in the same order, but with data passed as RDDs. It was hypothesised that the required data could be either cached in memory entirely at all times, or if not, regenerating them would still be faster than involving the disk I/O loop (e.g. by using <code>MEMORY_AND_DISK</code>). In short, the default caching strategy was used everywhere.</p> +</li> +<li> +<p><strong>Regression tests:</strong> Lacking tests apart from an id uniqueness check, meant there were no means to detect bugs introduced by the migration. Designing and implementing a comprehensive test suite was out of scope, so instead, regression testing was utilised, with the MapReduce output as the baseline. The original output mostly consists of Hadoop sequence files which can be read into Spark, allowing comparisons to be drawn with the output from the RDD produced by the migrated code.</p> +</li> +<li> +<p><strong>Thread-safety concerns:</strong> Soon after migrating the first generator and running the regression tests, there were clear discrepancies in the output. These only surfaced when the parallelization level was set greater than 1. This indicated the presence of potential race conditions. 
Thread-safety wasn&rsquo;t a concern in the original implementation due to the fact that MapReduce doesn&rsquo;t use thread-based parallelization for mappers and reducers.<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> In Spark however, tasks are executed by parallel threads in the same JVM application, so the code is required to be thread-safe. After some debugging, a bug was discovered originating from the shared use of java.text.SimpleDateFormat (notoriously known to be not thread-safe) in the serializers. This was resolved simply by changing to java.time.format.DateTimeFormatter. There were multiple instances of some static field on an object being mutated concurrently. In some cases this was a temporary buffer and was easily resolved by making it an instance variable. In another case a shared context variable was used, which was resolved by passing dedicated instances as function arguments. Sadly, the Java language has the same syntax for accessing locals, fields and statics, <sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup> which makes it somewhat harder to find potential unguarded shared variables.</p> +</li> +</ul> +<h2 id="case-study-person-ranking">Case study: Person ranking</h2> +<p>Migrating was rather straightforward, however, the so-called person ranking step required some thought. The goal of this step is to organize persons so that similar ones appear close to each other in a deterministic order. This provides a scalable way to cluster persons according to a similarity metric, as introduced in the <a href="#references">S3G2 paper [3]</a>.</p> +<h3 id="the-original-mapreduce-version">The original MapReduce version</h3> +<p><img src="person_ranking.svg" alt=""> \ <em>Figure 2. Diagram of the MapReduce code for ranking persons</em></p> +<p>The implementation, shown in pseudocode above, works as follows:</p> +<ol> +<li>The equivalence keys are mapped to each person and fed into TotalOrderPartitioner which maintains an order sensitive partitioning while trying to emit more or less equal sized groups to keep the data skew low.</li> +<li>The reducer keys the partitions with its own task id and a counter variable which has been initialized to zero and incremented on each person, establishing a local ranking inside the group. The final state of the counter (which is the total number of persons in that group) is saved to a separate &ldquo;side-channel&rdquo; file upon the completion of a reduce task.</li> +<li>In a consecutive reduce-only stage, the global order is established by reading all of these previously emitted count files in the order of their partition number in each reducer, then creating an ordered map from each partition number to the corresponding cumulative count of persons found in all preceding ones. This is done in the setup phase. In the reduce function, the respective count is incremented and assigned to each person.</li> +</ol> +<p>Once this ranking is done, the whole range is sliced up into equally sized blocks, which are processed independently. For example, when wiring relationships between persons, only those appearing in the same block are considered.</p> +<h3 id="the-migrated-version">The migrated version</h3> +<p>Spark provides a sortBy function which takes care of the first step above in a single line. The gist of the problem remains collecting the partition sizes and making them available in a later step. 
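</p>
+<p>The following sketch (with illustrative names; not the actual Datagen code) shows the shape of this in Spark&rsquo;s RDD API: sort by the similarity key, count the elements of each sorted partition in a separate job, broadcast the cumulative counts, and assign globally unique ranks inside each partition.</p>
+<pre><code class="language-scala">import org.apache.spark.SparkContext
import org.apache.spark.rdd.RDD
import scala.reflect.ClassTag

object PersonRanking {
  // Sketch of the migrated ranking step; the Person type is stood in for by a generic T.
  def rankBy[T: ClassTag](sc: SparkContext, persons: RDD[T], key: T => String): RDD[(Long, T)] = {
    // Order-preserving, roughly equal-sized partitioning by the equivalence key.
    val sorted = persons.sortBy(key)

    // Separate job: the number of persons in each sorted partition.
    val partitionSizes: Array[Long] = sorted
      .mapPartitionsWithIndex((i, it) => Iterator((i, it.size.toLong)))
      .collect()
      .sortBy(_._1)
      .map(_._2)

    // Cumulative sizes give the first rank of every partition; the broadcast variable
    // plays the role of the side-channel count files in the MapReduce version.
    val firstRank = sc.broadcast(partitionSizes.scanLeft(0L)(_ + _))

    sorted.mapPartitionsWithIndex { (i, it) =>
      it.zipWithIndex.map { case (person, j) => (firstRank.value(i) + j, person) }
    }
  }
}
</code></pre>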
<p>Where the MapReduce version relies on a side output, the Spark version collects the partition sizes in a separate job and passes them to the next phase using a broadcast variable; the resulting code is a fraction of the size of the original.</p>
+<h2 id="benchmarks">Benchmarks</h2>
+<p>Benchmarks were carried out on AWS <a href="https://aws.amazon.com/emr/">EMR</a>, originally utilising <a href="https://aws.amazon.com/ec2/instance-types/i3/">i3.xlarge</a> instances because of their fast NVMe SSD storage and ample amount of RAM.</p>
+<p>The application parameter <code>hadoop.numThreads</code> controls the number of reduce threads in each Hadoop job for the MapReduce version and the number of partitions in the serialization jobs in the Spark one. For MapReduce, this was set to n_nodes, i.e. the number of machines; experimentation yielded slowdowns for higher values. The Spark version, on the other hand, performed better with this parameter set to n_nodes * v_cpu. The scale factor (SF) parameter determines the output size. It is defined so that one SF unit generates around 1 GB of data. That is, SF10 generates around 10 GB, SF30 around 30 GB, etc. It should be noted, however, that the output was only around 60% of this in these experiments, for two reasons. First, update stream serialization was not migrated to Spark, due to problems in the original implementation. Of course, for the purpose of a faithful comparison the corresponding code was removed from the MapReduce version as well before executing the benchmarks. This explains a 10% reduction from the expected size. The rest can be attributed to incorrectly tuned parameters.<sup id="fnref:5"><a href="#fn:5" class="footnote-ref" role="doc-noteref">5</a></sup> The MapReduce results were as follows:</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * worker/SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10</td>
+<td>1</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>16</td>
+<td>1.60</td>
+</tr>
+<tr>
+<td>30</td>
+<td>1</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>34</td>
+<td>1.13</td>
+</tr>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>40</td>
+<td>1.20</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>44</td>
+<td>1.32</td>
+</tr>
+</tbody>
+</table>
+<p>It can be observed that the runtime per scale factor only increases slowly, which is good. The metric charts show an underutilized, bursty CPU. The bursts are presumably interrupted by the disk I/O parts, when the node is writing the results of a completed job. It can also be seen that the memory only starts to get consumed after 10 minutes of the run have passed.</p>
+<p><img src="mr_sf100_cpu_load.png" alt=""> <br>
+<em>Figure 3. CPU Load for the Map Reduce cluster is bursty and less than<br>
+50% on average (SF100, 2nd graph shows master)</em></p>
+<p><img src="mr_sf100_mem_free.png" alt=""> <br>
+<em>Figure 4.
The job only starts to consume memory when already 10 minutes<br>
+into the run (SF100, 2nd graph shows master)</em></p>
+<p>Let&rsquo;s see how Spark fares.</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * worker/SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10</td>
+<td>1</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>10</td>
+<td>1.00</td>
+</tr>
+<tr>
+<td>30</td>
+<td>1</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>21</td>
+<td>0.70</td>
+</tr>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>27</td>
+<td>0.81</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>36</td>
+<td>1.08</td>
+</tr>
+<tr>
+<td>1000</td>
+<td>30</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>47</td>
+<td>1.41</td>
+</tr>
+<tr>
+<td>3000</td>
+<td>90</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>47</td>
+<td>1.41</td>
+</tr>
+</tbody>
+</table>
+<p>A similar trend can be seen here; however, the runtimes are around 70% of those of the MapReduce version. It can be seen that the larger scale factors (SF1000 and SF3000) yielded longer runtimes than expected. On the metric charts of SF100 the CPU shows full utilization, except at the end, when the results are serialized in one go and the CPU is basically idle (the snapshot of the diagram unfortunately doesn&rsquo;t include this part). Spark can be seen to have used up all the memory pretty fast, even in the case of SF100. In the case of SF1000 and SF3000, the nodes run so low on memory that most probably some of the RDDs have to be calculated multiple times (no disk-level serialization was used here), which seems to be the most plausible explanation for the slowdowns experienced. In fact, the OOM errors encountered when running SF3000 support this hypothesis even further. It was thus proposed to scale up the RAM in the instances. The CPU utilization hints that adding some extra vCPUs could yield a further speedup.</p>
+<p><img src="spark_sf100_cpu_load.png" alt=""> <br>
+<em>Figure 5. Full CPU utilization for Spark (SF100, last graph shows<br>
+master)</em></p>
+<p><img src="spark_sf100_mem_free.png" alt=""> <br>
+<em>Figure 6. Spark eats up memory fast (SF100, 2nd graph shows master)</em></p>
+<p>i3.2xlarge would have been the most straightforward option for scaling up the instances; however, the humongous 1.9 TB disk of this instance type is completely unnecessary for the job.
Instead the cheaper r5d.2xlarge instance was utilised, largely identical to i3.2xlarge, except it <em>only</em> has a 300 GB SSD.</p> +<table> +<thead> +<tr> +<th>SF</th> +<th>workers</th> +<th>Platform</th> +<th>Instance Type</th> +<th>runtime (min)</th> +<th>runtime * worker/SF (min)</th> +</tr> +</thead> +<tbody> +<tr> +<td>100</td> +<td>3</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>16</td> +<td>0.48</td> +</tr> +<tr> +<td>300</td> +<td>9</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>21</td> +<td>0.63</td> +</tr> +<tr> +<td>1000</td> +<td>30</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>26</td> +<td>0.78</td> +</tr> +<tr> +<td>3000</td> +<td>90</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>25</td> +<td>0.75</td> +</tr> +<tr> +<td>10000</td> +<td>303</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>25</td> +<td>0.75</td> +</tr> +</tbody> +</table> +<p>The last column clearly demonstrates our ability to keep the cost per scale factor unit constant.</p> +<h2 id="next-steps">Next steps</h2> +<p>The next improvement is refactoring the serializers so they use Spark&rsquo;s high-level writer facilities. The most compelling benefit is that it will make the jobs fault-tolerant, as Spark maintains the integrity of the output files in case the task that writes it fails. This makes Datagen more resilient and opens up the possibility to run on less reliable hardware configuration (e.g. EC2 spot nodes on AWS) for additional cost savings. They will supposedly also yield some speedup on the same cluster configuration.</p> +<p>As already mentioned, the migration of the update stream serialization was ignored due to problems with the original code. Ideally, they should be implemented with the new serializers.</p> +<p>The Spark migration also serves as an important building block for the next generation of LDBC benchmarks. As part of extending the SNB benchmark suite, the SNB task force has recently extended Datagen with support for <a href="#references">generating delete operations [1]</a>. The next step for the task force is to fine-tune the temporal distributions of these deletion operations to ensure that the emerging sequence of events is realistic, i.e. the emerging distribution resembles what a database system would experience when serving a real social network.</p> +<h2 id="acknowledgements">Acknowledgements</h2> +<p>This work is based upon the work of Arnau Prat, Gábor Szárnyas, Ben Steer, Jack Waudby and other LDBC contributors. 
Thanks for your help and feedback!</p> +<h2 id="references">References</h2> +<p>[1] <a href="https://ldbcouncil.org/docs/papers/datagen-deletes-grades-nda-2020.pdf">Supporting Dynamic Graphs and Temporal Entity Deletions in the LDBC Social Network Benchmark&rsquo;s Data Generator</a></p> +<p>[2] <a href="https://www.youtube.com/watch?v=ZQOLuCOOpSI">9th TUC Meeting &ndash; LDBC SNB Datagen Update &ndash; Arnau Prat (UPC)</a> - <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">slides</a></p> +<p>[3] <a href="https://research.vu.nl/en/publications/s3g2-a-scalable-structure-correlated-social-graph-generator">S3G2: a Scalable Structure-correlated Social Graph Generator</a></p> +<p>[4] <a href="https://arxiv.org/abs/2001.02299">The LDBC Social Network Benchmark</a></p> +<p>[5] <a href="https://ldbcouncil.org/">LDBC</a> - <a href="https://github.com/ldbc">LDBC GitHub organization</a></p> +<div class="footnotes" role="doc-endnotes"> +<hr> +<ol> +<li id="fn:1"> +<p>Also makes it easier to map to a tabular format thus it is a SQL friendly representation.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:2"> +<p>It&rsquo;s hard to imagine this done declaratively in SQL.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:3"> +<p>Instead, multiple YARN containers have to be used if you want to parallelize on the same machine.&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:4"> +<p>Although editors usually render these using different font styles.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:5"> +<p>With the addition of deletes, entities often get inserted and deleted during the simulation (which is normal in a social network). During serialization, we check for such entities and omit them. However, we forgot to calculate this when determining the output size, which we will amend when tuning the distributions.&#160;<a href="#fnref:5" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +</ol> +</div> + + + + + Twelfth TUC Meeting + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + Fri, 05 Jul 2019 08:30:00 +0100 + + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + <p>LDBC is pleased to announce its Twelfth Technical User Community (TUC) meeting.</p> +<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event on the last Friday of <strong><a href="https://sigmod2019.org/">SIGMOD/PODS 2019</a></strong> in Amsterdam, The Netherlands, in the conference venue of <strong><a href="http://sigmod2019.org/conf_venue">Beurs van Berlage</a></strong>. The room is the Mendes da Silva kamer. 
Please check its tips for <strong><a href="http://sigmod2019.org/accommodation">accommodation in Amsterdam</a></strong>.</p> +<p>Note also that at SIGMOD/PODS in Amsterdam on Sunday, June 30, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2019">GRADES-NDA 2019</a>, that may be of interest to our audience (this generally holds for the whole SIGMOD/PODS program, of course).</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>You need to be registered in order to get into the SIGMOD/PODS venue. Friday, July 5, is the final, workshop, day of SIGMOD/PODS, and the LDBC TUC meeting joins the other workshops for coffee and lunch.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management.</p> +<p><strong>Talk proposals can be sent to Peter Boncz</strong>, who is also the local organizer. <strong>Please also send your slides to this email for archiving on this site.</strong></p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting, there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The morning slot (08:30-10:30) is reserved for an LDBC Board Meeting, to which in principle only LDBC directors are invited (that meeting will be held in the same room).</p> +<p>The TUC meeting will start on Friday morning after the morning coffee break of SIGMOD/PODS 2019 (<strong>room: Mendes da Silva kamer</strong>):</p> +<p>08:30-10:30 LDBC Board Meeting (non-public)</p> +<p>10:30-11:00 Coffee</p> +<p>11:00-12:45 Session 1: Graph Benchmarks</p> +<ul> +<li> +<p>11:00-11:05 Welcome &amp; introduction</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230404.pdf">11:05-11:45 Gabor Szarnyas (BME), Benjamin Steer (QMUL), Jack Waudby (Newcastle University): Business Intelligence workload: Progress report and roadmap</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706117.pdf">11:45-12:00 Frank McSherry (Materialize): Experiences implementing LDBC queries in a dataflow system</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706118.pdf">12:00-12:25 Vasileios Trigonakis (Oracle): Evaluating a new distributed graph query engine with LDBC: Experiences and limitations</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706130.pdf">12:25-12:45 Ahmed Musaafir (VU Amsterdam): LDBC Graphalytics</a></p> +</li> +</ul> +<p>12:45-14:00 Lunch</p> +<p>14:00-16:05 Session 2: Graph Query Languages</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706120.pdf">14:00-14:25 Juan Sequeda (Capsenta): Property Graph Schema Working Group: A progress report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706121.pdf">14:25-14:50 Stefan Plantikow (Neo4j): GQL: Scope and features</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706122.pdf">report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706119.pdf">14:50-15:15 Vasileios Trigonakis (Oracle): Property graph extensions for the SQL standard</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706129.pdf">15:15-15:40 Alin Deutsch (TigerGraph): Modern graph analytics support in GSQL, TigerGraph&rsquo;s query language</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230401.pdf">15:40-16:05 Jan Posiadała (Nodes and Edges, Poland): Executable semantics of graph query language</a></p> +</li> +</ul> +<p>16:05-16:30 Coffee</p> 
+<p>16:30-17:50 Session 3: Graph System Performance</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111968258.pdf">16:30-16:50 Per Fuchs (CWI): Fast, scalable WCOJ graph-pattern matching on in-memory graphs in Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706124.pdf">16:50-17:10 Semih Salihoglu (University of Waterloo): Optimizing subgraph queries with a mix of tradition and modernity</a> <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706116.pptx">pptx</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706128.pdf">17:10-17:30 Roi Lipman (RedisGraph): Evaluating Cypher queries and procedures as algebraic operations within RedisGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706133.pdf">17:30-17:50 Alexandru Uta (VU Amsterdam): Low-latency Spark queries on updatable data</a></p> +</li> +</ul> +<p>If there is interest, we will organize a social dinner on Friday evening for LDBC attendees.</p> + + + + + Eleventh TUC Meeting + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + Fri, 08 Jun 2018 08:30:00 -0500 + + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + <p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmark development, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event preceding the <a href="https://sigmod2018.org/">SIGMOD/PODS 2018</a> conference in Houston, Texas (not too far away, the whole next week). Note also that at SIGMOD/PODS in Houston on Sunday 10, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2018/">GRADES-NDA 2018</a> as well, so you might combine travel.</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz (<a href="mailto:boncz@cwi.nl">boncz@cwi.nl</a>) and Larri (<a href="mailto:larri@ac.upc.ed">larri@ac.upc.edu</a>). 
Local organizer is Juan Sequeda (<a href="mailto:juanfederico@gmail.com">juanfederico@gmail.com</a>).</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its interactive, business analytics and graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00:</p> +<ul> +<li> +<p>10:30-10:35 Peter Boncz (CWI) - introduction to the LDBC TUC meeting</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090478.pdf">10:35-11:00 Juan Sequeda (Capsenta) - Announcing: gra.fo</a></p> +</li> +<li> +<p>11:00-11:30 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090466.pdf">11:30-11:55 Gabor Szarnyas (BME) - LDBC benchmarks: three aspects of graph processing</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090463.pdf">11:55-12:20 Peter Boncz (CWI) - G-CORE: a composable graph query language by LDBC</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090472.pdf">12:20-12:45 Yinglong Xia (Huawei) - Graph Engine for Cloud AI</a></p> +</li> +<li> +<p>12:45-14:00 lunch</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090474.pdf">14:00-14:25 Stefan Plantikow (Neo4j) - Composable Graph Queries and Multiple Named Graphs in Cypher for Apache Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090481.pdf">14:25-14:50 Oskar van Rest (Oracle) - Analyzing Stack Exchange data using Property Graph in Oracle</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090485.pdf">14:50-15:15 Brad Bebee (Amazon) - Neptune: the AWS graph management service</a></p> +</li> +<li> +<p>15:15-15:40 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99811329.pdf">15:40-16:05 Bryon Jacob (data.world): Broadening the Semantic Web</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99287041.pdf">16:05-16:30 Jason Plurad (IBM) - Graph Computing with JanusGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99745793.pdf">16:30-16:55 Arthur Keen (Cambridge Semantics): AnzoGraph</a></p> +</li> +<li> +<p><a href="http://relational.ai/">16:55-17:20 Molham Aref (relational.ai)</a>) - Introducing.. 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99418113.pdf">relational.ai</a></p> +</li> +<li> +<p>18:00 - 20:00 social dinner in Austin (sponsored by Intel Corp.), Coopers BBQ, 217 Congress Ave, Austin, TX 78701</p> +</li> +</ul> +<h3 id="location">Location</h3> +<p>The TUC will be held at the <a href="https://www.cs.utexas.edu/">University of Texas at Austin, Department of Computer Science</a> in the <a href="https://www.google.com/maps/place/The+University+of+Texas:+Department+of+Computer+Science/@30.2860955,-97.737582,18z/data=!4m5!3m4!1s0x0:0x12edecc8226b3241!8m2!3d30.2862279!4d-97.7365348">Gates Dell Complex (GDC): 2317 Speedway, Austin TX, 78712</a> Room: GDC 6.302</p> +<p>The GDC building has a North and a South building. GDC 6.302 is in the North building. When you enter the main entrance, the North building is on the left and it is served by a pair of elevators. You can take or the elevator to the 6th floor. Exit the elevator on the 6th floor. Turn left, right, left.</p> +<h3 id="from-austin-to-sigmodpods-houston-on-saturday-june-9">From Austin to SIGMOD/PODS (Houston) on Saturday June 9</h3> +<p>Many of the attendees will be going to SIGMOD/PODS which will be held in Houston.</p> +<h4 id="bus">Bus</h4> +<p>One option is to take a <a href="https://us.megabus.com/journey-planner/journeys?days=1&amp;concessionCount=0&amp;departureDate=2018-06-09&amp;destinationId=318&amp;inboundOtherDisabilityCount=0&amp;inboundPcaCount=0&amp;inboundWheelchairSeated=0&amp;nusCount=0&amp;originId=320&amp;otherDisabilityCount=0&amp;pcaCount=0&amp;totalPassengers=1&amp;wheelchairSeated=0">MegaBus that departs from downtown Austin and arrives at downtown Houston</a>.</p> +<p>There is a bus that departs at 12:00PM and arrives at 3:00pm. Cost is $20 (as of April 23).</p> +<p>If you want to spend the day in Austin, there is a bus that departs at 9:55PM and arrives at 12:50am. Cost is $5 (as of April 23).</p> + + + + + Tenth TUC Meeting + https://ldbcouncil.org/event/tenth-tuc-meeting/ + Fri, 01 Sep 2017 10:30:00 +0100 + + https://ldbcouncil.org/event/tenth-tuc-meeting/ + <p>This will be a one-day event at the <a href="http://www.vldb.org/2017">VLDB 2017</a> conference in Munich, Germany on September 1, 2017.</p> +<p>Topics and activities of interest in these TUC meetings are:</p> +<ul> +<li>Presentation on graph data management usage scenarios.</li> +<li>Presentation of the benchmarking results for the different benchmarks, as well as the graph query language task force.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Adrian Diaz (UPC) at <a href="mailto:adiaz@ac.upc.edu">adiaz@ac.upc.edu</a> to register; registration is free, but required.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. 
Talk proposals are handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00</p> +<p>10:30-12:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87588865.pdf">Peter Boncz (CWI): GraphQL task force update - the G-CORE proposal</a> (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868018.pptx">pptx</a>)</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868008.pdf">Gabor Szarnyas (Budapest University of Technology and Economics Hungarian Academy of Sciences): Updates on the Social Network Benchmark BI Workload</a></li> +<li>Alexandru Iosup, Wing Lung Ngai (VU/TU Delft): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868014.pdf">LDBC Graphalytics v0.9</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868013.pdf">Graphalytics Global Competition and Graphalytics Custom Benchmark</a></li> +</ul> +<p>12:00-13:30: lunch break</p> +<p>13:30-15:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868024.pdf">Arnau Prat (UPC): Datasynth: Democratizing property graph generation</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868026.pdf">Marcus Paradies (SAP): SAP HANA GraphScript</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031809.pdf">Yinglong Xia (Huawei): The EYWA Graph Engine in a Cloud AI Platform</a></li> +<li>Gaétan Hains (Huawei): Cost semantics for graph queries</li> +</ul> +<p>15:00-15:30: break</p> +<p>15:30-17:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031812.pdf">Petra Selmer and Stefan Plantikow (Neo4j): openCypher Developments in 2017</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87195650.pdf">Markus Kaindl (Springer): SN SciGraph &ndash; Building a Linked Data Knowledge Graph for the Scholarly Publishing Domain</a></li> +<li>Irini Fundulaki (FORTH): The HOBBIT Link Discovery and Versioning Benchmarks</li> +<li>Ghislain Atemezing (Mondeca): Benchmarking Enterprise RDF stores with Publications Office Dataset</li> +</ul> +<p>Speakers should aim for a <strong>20-minute talk</strong>.</p> +<p>Further:</p> +<ul> +<li>on Friday 
evening (19:00-21:00) there will be a <strong>social dinner</strong> at <a href="https://www.loewenbraeukeller.com/en/pub-and-beer-garden/">Löwenbräukeller</a>, sponsored and arranged by LDBC member Huawei (who have their European Research Center in Munich).</li>
+<li>on Friday morning (8:30-10:30) there will be a meeting of the LDBC board of directors, but this meeting is not public.</li>
+</ul>
+<h3 id="venue">Venue</h3>
+<p>The Technical University of Munich (TUM) is hosting the <a href="http://www.vldb.org/2017">VLDB conference</a> that week; on the day of the TUC meeting the main conference will have finished, but there will be a number of co-located workshops ongoing, and the TUC participants will blend in with that crowd for the breaks and lunch.</p>
+<p>The TUC meeting will be held in <strong>Room 2607</strong> alongside the VLDB workshops that day (MATES, ADMS, DMAH, DBPL and BOSS).</p>
+<p><strong>address: Technische Universität München (TUM), Arcisstraße 21, 80333 München</strong></p>
+<p><a href="https://www.google.nl/maps/place/Technische+Universit%C3%A4t+M%C3%BCnchen/@48.14966,11.5656715,17z/data=!3m1!4b1!4m5!3m4!1s0x479e7261336d8c11:0x79a04d44dc5bf19d!8m2!3d48.14966!4d11.5678602?hl=en">Google Maps</a></p>
+<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920002.jpg" alt=""><br>
+<img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920003.jpg" alt=""></p>
+
+
+
+
+ Ninth TUC Meeting
+ https://ldbcouncil.org/event/ninth-tuc-meeting/
+ Thu, 09 Feb 2017 15:07:18 -0400
+
+ https://ldbcouncil.org/event/ninth-tuc-meeting/
+ <p>LDBC is pleased to announce its Ninth Technical User Community (TUC) meeting.</p>
+<p>This will be a two-day event at <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> in Walldorf, Germany on February 9+10, 2017.</p>
+<p>This will be the third TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will cover the following aspects:</p>
+<ul>
+<li>A two-day event, with one day devoted to users&rsquo; experiences and one day devoted to benchmarking experiences.</li>
+<li>Presentation of the benchmarking results for the different benchmarks.</li>
+<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li>
+</ul>
+<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>.</p>
+<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p>
+<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present.
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Inalytics and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Thursday morning, with a program from 09:00-18:00, interrupted by a lunch break.</p> +<p>Thursday evening (19:00-21:00) there will be a <strong>social dinner</strong> in Heidelberg.</p> +<p>Friday morning the event resumes from 9:00-12:00. In the afternoon, there is a (closed) LDBC Board of Directors meeting (13:00-16:30) at the same venue.</p> +<h4 id="social-dinner">Social Dinner</h4> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235334.png" alt=""></p> +<p><strong>Address: Hauptstraße 217, 69117 Heidelberg</strong><br> +<strong>Time: 19:00 / 7pm</strong></p> +<p>(See attachments at the bottom of the page)</p> +<h5 id="thursday">Thursday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>Welcome and logistics - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>9:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235329.pdf">Intro + state of the LDBC - Josep Lluis Larriba Pey</a> (UPC)</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235338.pdf">LDBC Graph QL task force</a> - Hannes Voigt (TU Dresden)</td> +</tr> +<tr> +<td>9:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235335.pdf">PGQL Status Update and Comparison to LDBC&rsquo;s Graph QL proposals</a> - Oskar van Rest (Oracle Labs)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628546.pdf">Adding shortest-paths to MonetDB</a> - Dean de Leo (CWI)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431939.pdf">Evolving Cypher for processing multiple graphs</a> - Stefan Plantikow (Neo Technology)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235346.pdf">Standardizing Graph Database Functionality - An Invitation to Collaborate</a> - Jan Michels (ISO/ANSI SQL, Oracle)&quot;</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235343.pdf">Dgraph: Graph database for production environment</a> - Tomasz Zdybal (Dgraph.io)</td> +</tr> +<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431945.pdf">LDBC Graphalytics: Current Capabilities, Upcoming Features, and Long-Term Roadmap</a> - Alexandru Iosup (TU Delft)</td> +</tr> 
+<tr> +<td>13:20</td> +<td>LDBC Graphalytics: Demo of the Live Archive and Competition Features - Tim Hegeman (TU Delft)</td> +</tr> +<tr> +<td>13:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">LDBC SNB Datagen Update</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431943.pdf">LDBC SNB Business Intelligence Workload: Chokepoint Analysis</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431947.pdf">LDBC Benchmark Cost Specification</a> (+discussion) - Moritz Kaufmann (TU Munich)</td> +</tr> +<tr> +<td>14:40</td> +<td>coffee break</td> +</tr> +<tr> +<td>15:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76316673.pdf">EYWA: the Distributed Graph Engine in Huawei MIND Platform</a> (Yinglong Xia)</td> +</tr> +<tr> +<td>15:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431949.pdf">Graph Processing in SAP HANA</a> - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>15:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628563.pdf">Distributed Graph Analytics with Gradoop</a> - Martin Junghanns (Univ Leipzig)</td> +</tr> +<tr> +<td>16:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152834.pdf">Distributed graph flows: Cypher on Flink and Gradoop</a> - Max Kießling (Neo Technology)</td> +</tr> +<tr> +<td>16:30</td> +<td>closing - Peter Boncz</td> +</tr> +<tr> +<td>17:30</td> +<td>end</td> +</tr> +</tbody> +</table> +<h5 id="friday">Friday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>welcome - Peter Boncz</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152833.pdf">Graph processing in obi4wan</a> - Frank Smit (OBI4WAN)</td> +</tr> +<tr> +<td>9:40</td> +<td>Graph problems in the space domain - Albrecht Schmidt (ESA)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75792387.pdf">Medical Ontologies for Healthcare</a> - Michael Neumann (SAP)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76447745.pdf">The Train Benchmark: Cross-Technology Performance Evaluation of Continuous Model Queries</a> - Gabor Szarnyas (BME)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76021761.pdf">Efficient sparse matrix computations and their generalization to graph computing applications</a> - Albert-Jan Yzelman (Huawei)</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152837.pdf">Experiments on Semantic Publishing Benchmark with large scale real news and LOD data at FactForge</a> - Atanas Kyriakov (Ontotext)</td> +</tr> 
+<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td>LDBC Board of Directors Meeting</td> +</tr> +<tr> +<td>17:00</td> +<td>end</td> +</tr> +</tbody> +</table> +<h3 id="logistics">Logistics</h3> +<h5 id="important-things-to-know"><strong>Important things to know</strong></h5> +<p>The following PDF guide provides additional information, such as recommended restaurants as well as sightseeing spots: <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">link</a></p> +<h5 id="venue"><strong>Venue</strong></h5> +<p>The TUC meeting will be held in the <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> at the SAP Guesthouse Kalipeh (<a href="https://www.kalipeh.com">https://www.kalipeh.com</a>). The address is:</p> +<p><strong>WDF 44 / SAP Guesthouse Kalipeh<br> +Dietmar-Hopp-Allee 15<br> +69190 Walldorf<br> +Germany</strong></p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p><a href="https://www.google.com/maps/place/SAP+Guesthouse+Kalipeh/@49.2951903,8.6436224,17z/data=!3m1!4b1!4m5!3m4!1s0x4797bea343a566af:0xd70698f3503ab74b!8m2!3d49.2951868!4d8.6458111">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/69042180.png" alt=""></p> +<h4 id="getting-there"><strong>Getting there</strong></h4> +<h5 id="by-plane"><strong>By plane</strong></h5> +<p>There are two airports close to SAP&rsquo;s headquarter: Frankfurt Airport (FRA) and Stuttgart-Echterdingen Airport (STR). The journey from Frankfurt Airport to SAP headquarters takes about one hour by car, while it takes slightly longer from Stuttgart- Echterdingen Airport. Concerning airfare, flights to Frankfurt are usually somewhat more expensive than to Stuttgart.</p> +<p>When booking flights to Frankfurt, you should be aware of Frankfurt-Hahn Airport (HHN), which serves low-cost carriers but is not connected to Frankfurt Airport. Frankfurt Hahn is approximately one hour from the Frankfurt main airport by car.</p> +<p>The journey from Frankfurt Airport to SAP headquarters takes about one hour by car (95 kilometers, or 59 miles).</p> +<p>Journey time from Stuttgart-Echterdingen Airport to SAP headquarters takes about 1 hour and 15 minutes by car (115 kilometers, or 71 miles).</p> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<p><strong>Traveling from Frankfurt Airport (FRA) to SAP Headquarters:</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A3/Würzburg/A5/Kassel/Basel/Frankfurt.&rdquo;</li> +<li>Follow the A5 to &ldquo;Basel/Karlsruhe/Heidelberg.&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<p>(Should you use a navigational system which does not recognize the street name &lsquo;Dietmar-Hopp-Allee&rsquo; please use &lsquo;Neurottstrasse&rsquo; instead.)</p> +<p><strong>Traveling from Stuttgart-Echterdingen Airport (STR) to SAP Headquarters:</strong></p> +<p>To get to SAP headquarters by car, there are two possible routes to take. The first leads you via Heilbronn and the second via Karlsruhe. 
The route via Karlsruhe is a bit shorter yet may be more congested.</p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A8/Stuttgart/B27.&rdquo;</li> +<li>Stay on A8 and follow the sign for &ldquo;Karlsruhe/Heilbronn/Singen/A8.&rdquo;</li> +<li>Follow A8 to Karlsruhe.</li> +<li>Take exit 41 &ndash; &ldquo;Dreieck Karlsruhe&rdquo; to merge onto A5 toward &ldquo;Frankfurt/Mannheim/Karlsruhe/Landau (Pfalz).&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<h6 id="parking"><strong>Parking</strong></h6> +<p>The closest parking lot to the event location is P7 (see figure above).</p> +<h5 id="by-train"><strong>By Train</strong></h5> +<p>As the infrastructure is very well developed in Europe, and in Germany in particular, taking the train is a great and easy way of traveling. Furthermore, the trains usually run on time, so this mode of travel is very convenient, especially for a group of people on longer journeys to major cities.</p> +<p><strong>From Frankfurt Airport (FRA) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to Terminal 1, level T (see overview in Appendix).</li> +<li>Go to the AIRail Terminal &ndash; &ldquo;Fernbahnhof&rdquo; (long-distance trains).</li> +<li>Choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP.&rdquo; It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> +<p><strong>From Stuttgart-Echterdingen Airport (STR) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to the S-Bahn station in the airport, following the sign (station is called &ldquo;Stuttgart Flughafen/Messe&rdquo;).</li> +<li>Take train number S2 or S3 to &ldquo;Stuttgart Hauptbahnhof&rdquo; (main station).</li> +<li>From Stuttgart Hauptbahnhof choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP&rdquo;. It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> + + + + + LDBC Is Proud to Announce the New LDBC Graphalytics Benchmark Draft Specification + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + Tue, 06 Sep 2016 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + <p>LDBC is proud to announce the new LDBC Graphalytics Benchmark draft specification.</p> +<p>LDBC Graphalytics is the first industry-grade graph data management benchmark for graph analysis platforms such as Giraph. It consists of six core algorithms, standard datasets, synthetic dataset generators, and reference outputs, enabling the objective comparison of graph analysis platforms. 
It has strong industry support from Oracle, Intel, Huawei and IBM, and was tested and optimized on the best industrial and open-source systems.</p>
+<p>Tim Hegeman of <a href="https://www.tudelft.nl">TU Delft</a> is today presenting the technical paper describing LDBC Graphalytics at the important <a href="https://www.vldb.org/conference.html">VLDB</a> (Very Large DataBases) conference in New Delhi, where his talk also marks the release by LDBC of Graphalytics as a benchmark draft. Practitioners are invited to read the PVLDB paper, download the software and try running it.</p>
+<p>LDBC is eager to receive feedback to guide the future adoption of LDBC Graphalytics.</p>
+<p>Learn more: <a href="/ldbc-graphalytics">LDBC Graphalytics</a></p>
+<p>GitHub: <a href="https://github.com/tudelft-atlarge/graphalytics">https://github.com/tudelft-atlarge/graphalytics</a></p>
+
+
+
+
+ Eighth TUC Meeting
+ https://ldbcouncil.org/event/eighth-tuc-meeting/
+ Wed, 22 Jun 2016 14:45:20 -0400
+
+ https://ldbcouncil.org/event/eighth-tuc-meeting/
+ <p>The LDBC consortium is pleased to announce its Eighth Technical User Community (TUC) meeting.</p>
+<p>This will be a two-day event at the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a> in Redwood Shores on <strong>Wednesday and Thursday June 22-23, 2016</strong>.</p>
+<p>This will be the second TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will cover the following aspects:</p>
+<ul>
+<li>A two-day event, with one day devoted to users&rsquo; experiences and one day devoted to benchmarking experiences.</li>
+<li>Presentation of the benchmarking results for the different benchmarks.</li>
+<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li>
+</ul>
+<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify Oracle security in advance, registration requests need to be in by <strong>June 12</strong>.</p>
+<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p>
+<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present.
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p>
+<p>In this page, you&rsquo;ll find information about the following items:</p>
+<ul>
+<li><a href="#agenda">Agenda</a></li>
+<li><a href="#logistics">Logistics</a>
+<ul>
+<li><a href="#date">Date</a></li>
+<li><a href="#venue">Venue</a></li>
+<li><a href="#getting-there">Getting there</a></li>
+</ul>
+</li>
+<li><a href="#accommodation">Accommodation</a></li>
+</ul>
+<h3 id="agenda">Agenda</h3>
+<p>On Wednesday, lunch is provided for all attendees at 12 pm. The TUC Meeting will start at 1pm.</p>
+<h6 id="wednesday-22th-of-june-2016-room-203"><strong>Wednesday, 22nd of June 2016 (Room 203)</strong></h6>
+<p>(full morning: LDBC Board of Directors meeting)</p>
+<ul>
+<li>12:00 - 13:00 Lunch (provided)</li>
+<li>13:00 - 13:30 Hassan Chafi (Oracle) and Josep L. Larriba-Pey (Sparsity): Registration and welcome.</li>
+<li>13:30 - 14:00 Peter Boncz (CWI) <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133891.pdf">LDBC introduction and status update</a>.</li>
+<li>14:00 - 15:00 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</li>
+<li>14:00 Arnau Prat (DAMA-UPC). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133902.pdf">Social Network Benchmark, Interactive workload</a>.</li>
+<li>14:30 Tim Hegeman (TU Delft). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133893.pdf">Social Network Benchmark, Analytics workload</a>.</li>
+<li>15:00 - 15:30 Coffee break</li>
+<li>15:30 - 17:00 Applications and use of Graph Technologies (chair Hassan Chafi)
+<ul>
+<li>15:30 Martin Zand (University of Rochester Clinical and Translational Science Institute). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133897.pdf">Graphing Healthcare Networks: Data, Analytics, and Use Cases.</a></li>
+<li>16:00 David Meibusch, Nathan Hawes (Oracle Labs Australia). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133901.pdf">Frappé: Querying and managing evolving code dependency graphs</a>.</li>
+<li>16:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133895.pdf">UniProt: challenges of a public SPARQL endpoint.</a></li>
+</ul>
+</li>
+<li>17:00 - 18:30 Graph Technologies (chair Peter Boncz)
+<ul>
+<li>17:00 Eugene I. Chong (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133904.pdf">Balancing Act to improve RDF Query Performance in Oracle Database</a>.</li>
+<li>17:30 Lijun Chang (University of New South Wales). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133906.pdf">Efficient Subgraph Matching by Postponing Cartesian Products</a>.</li>
+<li>18:00 Weining Qian (East China Normal University).
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133908.pdf">On Statistical Characteristics of Real-Life Knowledge Graphs</a>.</li> +</ul> +</li> +</ul> +<h6 id="thursday-23th-of-june-2016-room-203"><strong>Thursday, 23th of June 2016 (Room 203)</strong></h6> +<ul> +<li>08:00 - 09:00 Breakfast (provided)</li> +<li>09:00 - 10:00 Details on the progress of LDBC Task Forces 2 (chair Josep L. Larriba-Pey) +<ul> +<li>09:00 Peter Boncz (CWI). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133896.pdf">Query Language Task Force status</a></li> +<li>09:45 Marcus Paradies (SAP). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297729.pdf">Social Network Benchmark, Business Intelligence workload</a></li> +</ul> +</li> +<li>10:00 - 12:00 Graph Technologies and Benchmarking (chair Oskar van Rest) +<ul> +<li>10:00 Sergey Edunov (Facebook). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297731.pdf">Generating realistic trillion-edge graphs</a></li> +<li>10:30 George Fletcher (TU Eindhoven). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297733.pdf">An open source framework for schema-driven graph instance and graph query workload generation</a>.</li> +<li>11:00 Yinglong Xia (Huawei Research America): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297735.pdf">An Efficient Big Graph Analytics Platform</a>.</li> +<li>11:30 Zhe Wu (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297737.pdf">Bridging RDF Graph and Property Graph Data Models</a></li> +</ul> +</li> +<li>12:00 - 13:30 Lunch (provided)</li> +<li>13:30 - 15:30 Graph Technologies (chair Arnau Prat) +<ul> +<li>13:30 Tobias Lindaaker (Neo Technology). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297740.pdf">An open standard for graph queries: the Cypher contribution</a></li> +<li>14:00 Arash Termehchy (Oregon State University). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297742.pdf">Toward Representation Independent Graph Querying &amp; Analytics</a></li> +<li>14:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297745.pdf">In the service of the federation</a></li> +<li>15:00 Nandish Jayaram (Pivotal). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297747.pdf">Orion: Enabling Suggestions in a Visual Query Builder for Ultra-Heterogeneous Graphs</a>.</li> +</ul> +</li> +<li>15:30 - 16:00 Coffee break</li> +<li>16:00 - 17:15 Applications and use of Graph Technologies (chair Hassan Chafi) +<ul> +<li>16:00 Jans Aasman (Franz Inc.). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428806.pdf">Semantic Data Lake for Healthcare</a></li> +<li>16:15 Kevin Madden (Tom Sawyer Software). 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428812.pdf">Dismantling Criminal Networks with Graph and Spatial Visualization and Analysis</a></li> +<li>16:45 Juan Sequeda (Capsenta). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428810.pdf">Using graph representation and semantic technology to virtually integrate and search multiple diverse data sources</a></li> +<li>17:15 Kevin Wilkinson (Hewlett Packard Labs). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428808.pdf">LDBC SNB extensions</a></li> +</ul> +</li> +<li>17:45 - 18:15 Closing discussion</li> +</ul> +<h6 id="friday-24th-of-june-2016-room-105"><strong>Friday, 24th of June 2016 (Room 105)</strong></h6> +<p>At the same venue: the fourth international workshop on Graph Data Management, Experience and Systems (<strong>GRADES16</strong>).</p> +<p>18:30 social dinner for GRADES registrants (place to be announced)</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>22nd and 23rd June 2016</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a></p> +<p>The address is:</p> +<p><strong>Room 203 (Wed-Thu) &amp; Room 105 (Fri)</strong><br> +<strong>Oracle Conference Center</strong><br> +<strong>350 Oracle Parkway</strong><br> +<strong>Redwood City, CA 94065, USA</strong></p> +<p><strong>Maps and situation</strong></p> +<p><a href="https://www.google.com/maps/place/Oracle+Conference+Center/@37.5322827,-122.2667034,17z/data=!3m1!4b1!4m2!3m1!1s0x808f98b5450e8ca3:0xdc75e8b1c02bbb91">Google Maps link</a></p> +<p>Oracle Campus map:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/40927234.jpg" alt=""></p> +<h5 id="getting-there"><strong>Getting there</strong></h5> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<ul> +<li>[Southbound] <strong>-</strong> Take Highway 101 South (toward San Jose) to the Ralston Ave./Marine World Parkway exit. Take Marine World Parkway east which will loop you back over the freeway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +<li>[Northbound] <strong>-</strong> Take Highway 101 North (toward San Francisco) to the Ralston Ave./Marine World Parkway exit. Take the first exit ramp onto Marine World Parkway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +</ul> +<h5 id="parking"><strong>Parking</strong></h5> +<p>The Conference Center has a designated parking lot located directly across from the building. If the lot is filled there is also additional parking in any of the parking garages located near by. No parking permits are needed.</p> +<h5 id="public-transport"><strong>Public transport</strong></h5> +<p>Take the Caltrain to either San Carlos or Hillsdale and take the free Oracle shuttle from there. 
Get off the Oracle shuttle at 100 Oracle Parkway (second stop) and walk 5 minutes to get to the Conference Center.</p> +<ul> +<li>Caltrain timetables: <a href="http://www.caltrain.com/schedules/weekdaytimetable.html">http://www.caltrain.com/schedules/weekdaytimetable.html</a></li> +<li>Oracle Shuttle timetables: <a href="http://www.caltrain.com/schedules/weekdaytimetable.html">http://www.caltrain.com/schedules/Shuttles/Oracle_Shuttle.html</a></li> +</ul> +<p>You can also take the Caltrain to Belmont and walk 23 min, instead of taking the Oracle shuttle.</p> +<p>Alternatively, SamTrans (San Mateo County&rsquo;s Transit Agency) provides public bus service between the Millbrae BART station and Palo Alto with three stops on Oracle Parkway - one of which is directly in front of the Oracle Conference Center.</p> + + + + + LDBC and Apache Flink + https://ldbcouncil.org/post/ldbc-and-apache-flink/ + Mon, 16 Nov 2015 14:47:00 +0000 + + https://ldbcouncil.org/post/ldbc-and-apache-flink/ + <p>Apache Flink <a href="#references">[1]</a> is an open source platform for distributed stream and batch data processing. Flink&rsquo;s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.</p> +<p><img src="https://flink.apache.org/img/flink-stack-small.png" alt=""></p> +<p>Flink offers multiple APIs to process data from various data sources (e.g. HDFS, HBase, Kafka and JDBC). The DataStream and DataSet APIs allow the user to apply general-purpose data operations, like map, reduce, groupBy and join, on streams and static data respectively. In addition, Flink provides libraries for machine learning (Flink ML), graph processing (Gelly) and SQL-like operations (Table). 
All APIs can be used together in a single Flink program which enables the definition of powerful analytical workflows and the implementation of distributed algorithms.</p> +<p>The following snippet shows how a wordcount program can be expressed in Flink using the DataSet API:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">&gt;</span> text <span style="color:#f92672">=</span> env<span style="color:#f92672">.</span><span style="color:#a6e22e">fromElements</span><span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the past controls the future.&#34;</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the present controls the past.&#34;</span><span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>Tuple2<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">,</span> Integer<span style="color:#f92672">&gt;&gt;</span> wordCounts <span style="color:#f92672">=</span> text +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">flatMap</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> LineSplitter<span style="color:#f92672">())</span> <span style="color:#75715e">// splits the line and outputs (word,1) +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span>tuples<span style="color:#f92672">.</span><span style="color:#a6e22e">groupBy</span><span style="color:#f92672">(</span><span style="color:#ae81ff">0</span><span style="color:#f92672">)</span> <span style="color:#75715e">// group by word +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">.</span><span style="color:#a6e22e">sum</span><span style="color:#f92672">(</span><span style="color:#ae81ff">1</span><span style="color:#f92672">);</span> <span style="color:#75715e">// sum the 1&#39;s +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span>wordCounts<span style="color:#f92672">.</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>At the Leipzig University, we use Apache Flink as execution layer for our graph analytics platform Gradoop <a href="#references">[2]</a>. The LDBC datagen helps us to evaluate the scalability of our algorithms and operators in a distributed execution environment. To use the generated graph data in Flink, we wrote a tool that transforms the LDBC output files into Flink data sets for further processing <a href="#references">[3]</a>. 
Using the class <code>LDBCToFlink</code>, LDBC output files can be read directly from HDFS or from the local file system:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;hdfs:///ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> <span style="color:#75715e">// or &#34;/path/to/social_network&#34; +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> vertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> edges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The tuple classes <code>LDBCVertex</code> and <code>LDBCEdge</code> hold the information generated by the LDBC datagen and are created directly from its output files. During the transformation process, globally unique vertex identifiers are created based on the LDBC identifier and the vertex class. When reading edge files, source and target vertex identifiers are computed in the same way to ensure consistent linking between vertices.</p> +<p>Each <code>LDBCVertex</code> instance contains:</p> +<ul> +<li>an identifier, which is unique among all vertices * a vertex label (e.g. <code>Person</code>, <code>Comment</code>) * a key-value map of properties including also multivalued properties<br> +(e.g. <code>Person.email</code>)</li> +</ul> +<p>Each <code>LDBCEdge</code> instance contains:</p> +<ul> +<li>an identifier, which is unique among all edges</li> +<li>an edge label (e.g. <code>knows</code>, <code>likes</code>)</li> +<li>a source vertex identifier</li> +<li>a target vertex identifier</li> +<li>a key-value map of properties</li> +</ul> +<p>The resulting datasets can be used by the DataSet API and all libraries that are built on top of it (i.e. Flink ML, Gelly and Table). In the following example, we load the LDBC graph from HDFS, filter vertices with the label <code>Person</code> and edges with the label <code>knows</code> and use Gelly to compute the connected components of that subgraph. 
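+The <code>VertexLabelFilter</code> and <code>EdgeLabelFilter</code> helpers used in the listing below are not part of Flink itself; they are small <code>FilterFunction</code> implementations. As a rough, illustrative sketch (it assumes <code>LDBCVertex</code> exposes its label through a <code>getLabel()</code> accessor, which may not match the actual ldbc-flink-import API), the vertex variant could look like this:
+<pre><code class="language-java">import org.apache.flink.api.common.functions.FilterFunction;
+
+// Illustrative sketch only: keeps vertices that carry a given label.
+// Assumes LDBCVertex offers a getLabel() accessor; the accessor provided
+// by ldbc-flink-import may be named differently.
+public class VertexLabelFilter implements FilterFunction&lt;LDBCVertex&gt; {
+
+    private final String label;
+
+    public VertexLabelFilter(String label) {
+        this.label = label;
+    }
+
+    @Override
+    public boolean filter(LDBCVertex vertex) {
+        // retain only vertices whose label matches, e.g. "Person"
+        return label.equals(vertex.getLabel());
+    }
+}
+</code></pre>
+An <code>EdgeLabelFilter</code> for the <code>knows</code> edges follows the same pattern.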
The full source code is available on GitHub <a href="#references">[4]</a>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;/home/s1ck/Devel/Java/ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter vertices with label “Person” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> ldbcVertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">VERTEX_CLASS_PERSON</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter edges with label “knows” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> ldbcEdges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">EDGE_CLASS_KNOWS</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly vertices suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> vertices <span style="color:#f92672">=</span> ldbcVertices<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span 
style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly edges suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Edge<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;&gt;</span> edges <span style="color:#f92672">=</span> ldbcEdges<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>Graph<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;</span> g <span style="color:#f92672">=</span> Graph<span style="color:#f92672">.</span><span style="color:#a6e22e">fromDataSet</span><span style="color:#f92672">(</span>vertices<span style="color:#f92672">,</span> edges<span style="color:#f92672">,</span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// run connected components on the subgraph for 10 iterations +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> components <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> g<span style="color:#f92672">.</span><span style="color:#a6e22e">run</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> ConnectedComponents<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// print the component id of the first 10 vertices +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>components<span style="color:#f92672">.</span><span style="color:#a6e22e">first</span><span style="color:#f92672">(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">).</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The ldbc-flink-import tool is available on Github <a href="#references">[3]</a> and licensed under the GNU GPLv3. If you have any questions regarding the tool please feel free to contact me on GitHub. 
If you find bugs or have any ideas for improvements, please create an issue or a pull request.</p> +<p>If you want to learn more about Apache Flink, a good starting point is the main documentation <a href="#references">[5]</a> and if you have any question feel free to ask the official mailing lists.<br> +There is also a nice set of videos <a href="#references">[6]</a> available from the latest Flink Forward conference.</p> +<h4 id="references">References</h4> +<p>[1] <a href="http://flink.apache.org/">http://flink.apache.org/</a></p> +<p>[2] <a href="https://github.com/dbs-leipzig/gradoop">https://github.com/dbs-leipzig/gradoop</a></p> +<p>[3] <a href="https://github.com/s1ck/ldbc-flink-import">https://github.com/s1ck/ldbc-flink-import</a></p> +<p>[4] <a href="https://gist.github.com/s1ck/b33e6a4874c15c35cd16">https://gist.github.com/s1ck/b33e6a4874c15c35cd16</a></p> +<p>[5] <a href="https://ci.apache.org/projects/flink/flink-docs-release-0.10/">https://ci.apache.org/projects/flink/flink-docs-release-0.10/</a></p> +<p>[6] <a href="https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA">https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA</a></p> + + + + + Seventh TUC Meeting + https://ldbcouncil.org/event/seventh-tuc-meeting/ + Mon, 09 Nov 2015 14:17:30 -0400 + + https://ldbcouncil.org/event/seventh-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Seventh Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="http://www.research.ibm.com/labs/watson">IBM&rsquo;s TJ Watson</a> facility on <strong>Monday and Tuesday November 9/10, 2015.</strong></p> +<p>This will be the first TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify IBM security in advance, registration requests need to be in by Nov 1.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<p>In this page, you&rsquo;ll find information about the following items:</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a><br> +- <a href="#date"><strong>Date</strong></a><br> +- <a href="#venue"><strong>Venue</strong></a><br> +- <a href="#maps-and-situation"><strong>Maps and situation</strong></a><br> +- <a href="#getting-there"><strong>Getting there</strong></a></li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>Monday, 9th of November 2015</strong></p> +<p>8:45 - 9:15 Registration and welcome (Yinglong Xia and Josep L. Larriba Pey)</p> +<p>9:15 - 9:30 LDBC introduction and status update (Josep L. Larriba-Pey)</p> +<p>9:30 - 10:30 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</p> +<p>9:30 Arnau Prat (DAMA-UPC). Social Network Benchmark, Interactive workload</p> +<p>10:00 Orri Erling (OpenLink Software). Social Network Benchmark, Business Intelligence workload</p> +<p>10:30-11:00 Coffee break</p> +<p>11:00 - 12:30 Details on the progress of LDBC Task Forces 2 (chair Yinglong Xia)</p> +<p>11:00 Alexandru Iosup (TU Delft). Social Network Benchmark, Analytics workload.</p> +<p>11:30 Claudio Gutierrez (U Chile). Query Language Task Force status.</p> +<p>12:00 Atanas Kiryakov (Ontotext). Semantic Publishing Benchmark status</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 - 16:00 Technologies and benchmarking (chair Hassan Chafi)</p> +<p>14:00 Molham Aref (LogicBlox). Graph Data Management with LogicBlox</p> +<p>14:30 Peter Kogge (Notre Dame). BFS as in Graph500 on today&rsquo;s architectures</p> +<p>15:00 Ching-Yung Lin (IBM). Status and Demo of IBM System G</p> +<p>15:30-16:00 Coffee break</p> +<p>16:00 - 17:00 Technologies (chair Irini Fundulaki)</p> +<p>16:00 Kavitha Srinivas (IBM). SQLGraph: An efficient relational based property graph store</p> +<p>16:30 David Ediger (GeorgiaTech). STINGER</p> +<p>17:00 Gary King (Franz Inc.). AllegroGraph&rsquo;s SPARQL implementation with Social Network Analytics abilities using Magic Properties</p> +<p>17:30 Manoj Kumar (IBM). Linear Algebra Formulation for Large Graph Analytics</p> +<p>18:00 Reihaneh Amini (Wright State University) Linked Data in the GeoLink Usecase</p> +<p>19:00 Social dinner</p> +<p><strong>Tuesday 10th November 2015</strong></p> +<p>9:00 - 10:30 Technology, Applications and Benchmarking (chair Alexandru Iosup)</p> +<p>9:00 Philip Rathle (Neo). On openCypher</p> +<p>9:20 Morteza Shahriari (University of Florida). Multi-modal Probabilistic Knowledge Base for Remote Sensing Species Identification</p> +<p>9:50 Peter Kogge (Notre Dame). Challenging problems with Lexis Nexis Risk Solutions</p> +<p>10:10 Arnau Prat (DAMA-UPC). DATAGEN, status and perspectives for synthetic data generation</p> +<p>10:30 - 11:00 Coffee break</p> +<p>11:00 - 12:45 Applications and use of Graph Technologies (chair Atanas Kiryakov)</p> +<p>11:00 Hassan Chafi (Oracle). Status and characteristics of PGQL</p> +<p>11:20 David Guedalia (TAGIIO). Multi-tier distributed mobile applications and how they split their workload,</p> +<p>11:40 Guojing Cong (IBM). Algorithmic technique and architectural support for fast graph analysis</p> +<p>12:00 Josep Lluis Larriba-Pey. 
Conclusions for the TUC meeting and future perspectives</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>9th and 10th November 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the IBM Thomas J Watson Research Center.<br> +The address is:</p> +<p><strong>IBM Thomas J Watson Research Center</strong><br> +<strong>1101 Kitchawan Rd,</strong><br> +<strong>Yorktown Heights, NY 10598, USA</strong></p> +<p>If you are using a <em>GPS system</em>, please enter <strong>&ldquo;200 Aqueduct Road, Ossining NY, 10562&rdquo;</strong> for accurate directions to the lab entrance. You may also want to check the routing online.</p> +<p>The meeting will take place in the <em>Auditorium</em> on November 9th, and in Meeting Room <em>20-043</em> on November 10th.</p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p>You are highly suggested to <strong>rent a car</strong> for your convenience, since the public transportation system does not cover this area very well. Besides, there is no hotel within walkable distance to the IBM T.J. Watson Research Center. Feel free to find carpool with other attendees. You may find car rental and hotels through <a href="http://www.orbitz.com">www.orbitz.com</a>, or <a href="http://www.expedia.com">www.expedia.com</a> Feel free to email <a href="mailto:yxia@us.ibm.com">yxia@us.ibm.com</a> for any questions.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/seventh-tuc-meeting/attachments/6882333/15926330.png" alt=""></p> +<h6 id="getting-there"><strong>Getting there</strong></h6> +<p><strong>Upper and Eastern New England</strong></p> +<p>Route I-84 west to Route I-684, south to Exit 6, west on Route 35 to Route 100, south to Route 134, west 2.5 miles. IBM is on the left.</p> +<p><strong>New Haven and Connecticut Shores</strong></p> +<p>Merritt Parkway or New England Thruway (Route I-95) west to Route I-287, west to Exit 3, north on Sprain Brook Parkway, which merges into Taconic State Parkway, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New Jersey</strong></p> +<p>Take New York State Thruway (Route I-87) east across the Tappan Zee Bridge and follow signs to the Saw Mill Parkway north. Proceed north on Saw Mill River Parkway to Taconic State Parkway exit, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>Upstate New York</strong></p> +<p>Route I-84 east across Newburgh-Beacon Bridge to Exit 16-S. Taconic State Parkway south to Route 134 East exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New York City (Manhattan)</strong></p> +<p>Henry Hudson Parkway north, which becomes Saw Mill River Parkway, north to Taconic State Parkway exit. North on Taconic State Parkway to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>John F. Kennedy International Airport</strong></p> +<p>North on Van Wyck Expressway to the Whitestone Expressway and continue north across the Bronx-Whitestone Bridge to the Hutchinson River Parkway north to the Cross County Parkway exit and proceed west to the Bronx River Parkway. 
North on the Bronx River Parkway to the Sprain Brook Parkway, which merges into the Taconic State Parkway. Continue north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>LaGuardia Airport</strong></p> +<p>East on the Grand Central Parkway, north on the Whitestone Expressway, and continue north across the Bronx-Whitestone Bridge. Continue with instructions from John F. Kennedy International Airport, above.</p> +<p><strong>Newark International Airport</strong></p> +<p>North on the New Jersey Turnpike (Route I-95). Stay in local lanes and take Exit 72 for Palisades Interstate Parkway. North on the Palisades Interstate Parkway to the New York State Thruway, Route I-87, and east across the Tappan Zee Bridge. Continue with instructions from New Jersey, above.</p> +<p><strong>Stewart International Airport</strong></p> +<p>Route 207 east to Route I-84, east across Newburgh-Beacon Bridge to Taconic State Parkway, south. Continue with instructions from Upstate New York, above.</p> +<p><strong>Westchester County Airport</strong></p> +<p>Right on Route 120, north. Turn left where Route 120 merges with Route 133. Continue on Route 120. Cross Route 100 and continue straight on Shingle House Road to Pines Bridge Road. Turn right and proceed several hundred yards. IBM is on the left.</p> +<p><strong>Public Transportation</strong></p> +<p>Metropolitan Transportation Authority (MTA) train stations nearest to the Yorktown Heights location are the Croton-Harmon and White Plains stations. Taxi service is available at both locations.</p> + + + + + Elements of Instance Matching Benchmarks: a Short Overview + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + Tue, 16 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + <p>The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not explicitly stated but is discovered using <strong>instance matching</strong> techniques and tools. Instance matching is also known as <strong>record linkage</strong> <a href="#references">[1]</a>, <strong>duplicate detection</strong> <a href="#references">[2]</a>, <strong>entity resolution</strong> <a href="#references">[3]</a> and <strong>object identification</strong> <a href="#references">[4]</a>.</p> +<p>For instance, a search in Geonames (<a href="http://www.geonames.org/">http://www.geonames.org/</a>) for &ldquo;Athens&rdquo; would return a resource (i.e., URI) accompanied with a map of the area and information about the place; additional information for the city of Athens can be found in other datasets such as for instance DBpedia (<a href="http://dbpedia.org/">http://dbpedia.org/</a>) or Open Government Datasets (<a href="http://data.gov.gr/">http://data.gov.gr/</a>). 
To obtain all the necessary information about the city of Athens, we need to establish that the retrieved resources refer to the same real world object.</p>
+<p>Web resources are published by &ldquo;autonomous agents&rdquo; who choose their preferred information representation or the one that best fits the application of interest. Furthermore, different representations of the same real world entity may be due to data acquisition errors or to the different acquisition techniques used to process scientific data. Moreover, real world entities evolve and change over time, and sources need to keep track of these developments, a task that is very hard and often not possible. Finally, when integrating data from multiple sources, the integration process itself may add new erroneous data. Clearly, these problems are not unique to the era of Web Data; it is thus not surprising that instance matching systems have been around for several years <a href="#references">[2]</a><a href="#references">[5]</a>.</p>
+<p>It is, however, essential to develop, along with instance and entity matching systems, <em>instance matching benchmarks to determine the weak and strong points of those systems, as well as their overall quality, in order to support users in deciding which system to use for their needs</em>. Hence, well-defined, good-quality benchmarks are important for comparing the performance of the available or under-development instance matching systems. Benchmarks are used not only to inform users of the strengths and weaknesses of systems, but also to motivate developers, researchers and technology vendors to deal with the weak points of their systems and to improve their performance and functionality. They are also useful for identifying the settings in which each of the systems performs best. Benchmarking aims at providing an objective basis for such assessments.</p>
+<p>An instance matching benchmark for Linked Data consists of a <em>source</em> and a <em>target dataset</em> implementing a set of <em>test cases</em>, where each test case addresses a different kind of requirement regarding instance matching, a <em>ground truth</em> or <em>gold standard</em>, and finally the <em>evaluation metrics</em> used to <em>assess the benchmark</em>.</p>
+<p>Datasets are the raw material of a benchmark. A benchmark comprises a <em>source</em> and a <em>target</em> dataset, and the objective of an instance matching system is to discover the matches between the two. Datasets are characterized by (a) their <em>nature</em> (<em>real</em> or <em>synthetic</em>), (b) the <em>schemas/ontologies</em> they use, (c) their <em>domains</em>, (d) the <em>languages</em> they are written in, and (e) the <em>variations/heterogeneities</em> of the datasets. Real datasets are widely used in benchmarks since they offer realistic conditions for heterogeneity problems and they have realistic distributions. <em>Synthetic datasets</em> are generated using automated data generators and are useful because they offer fully controlled test conditions, have accurate gold standards and allow setting the focus on specific types of heterogeneity problems in a systematic manner.</p>
+<p>Datasets (and benchmarks) may contain different <em>kinds of variations</em> that correspond to <em>different test cases</em>. According to Ferrara et al.
<a href="#references">[6]</a><a href="#references">[7]</a>, three kinds of variations exist for Linked Data, namely <em>data variations</em>, <em>structural variations</em> and <em>logical variations</em>. The first refers mainly to differences due to typographical errors, differences in the employed data formats, language etc. The second refers to the differences in the structure of the employed Linked Data schemas. Finally, the third type derives from the use of semantically rich RDF and OWL constructs that enable one to define hierarchies and equivalence of classes and properties, (in)equality of instances, complex class definitions through union and intersection among others.</p> +<p>The common case in real benchmarks is that the datasets to be matched contain different kinds (combinations) of variations. On the other hand, synthetic datasets may be purposefully designed to contain specific types (or combinations) of variations (e.g., only structural), or may be more general in an effort to illustrate all the common cases of discrepancies that appear in reality between individual descriptions.</p> +<p>The <em>gold standard</em> is considered as the “correct answer sheet” of the benchmark, and is used to judge the completeness and soundness of the result sets of the benchmarked systems. For instance matching benchmarks employing synthetic datasets, the gold standard is always automatically generated, as the errors (variations) that are added into the datasets are known and systematically created. When it comes to real datasets, the gold standard can be either manually curated or (semi-) automatically generated. In the first case, domain experts manually mark the matches between the datasets, whereas in the second, supervised and crowdsourcing techniques aid the process of finding the matches, a process that is often time consuming and error prone.</p> +<p>Last, an instance matching benchmark uses <em>evaluation metrics</em> to determine and assess the systems’ output quality and performance. For instance matching tools, performance is not a critical aspect. On the other hand, an instance matching tool should return all and only the correct answers. So, what matters most is returning the relevant matches, rather than returning them quickly. For this reason, the evaluation metrics that are dominantly employed for instance matching benchmarks are the standard <em>precision</em>, <em>recall</em> and <em>f-measure</em> metrics.</p> +<h4 id="references">References</h4> +<p>[1] Li, C., Jin, L., and Mehrotra, S. (2006) Supporting efficient record linkage for large data sets using mapping techniques. WWW 2006.</p> +<p>[2] Dragisic, Z., Eckert, K., Euzenat, J., Faria, D., Ferrara, A., Granada, R., Ivanova, V., Jimenez-Ruiz, E., Oskar Kempf, A., Lambrix, P., Montanelli, S., Paulheim, H., Ritze, D., Shvaiko, P., Solimando, A., Trojahn, C., Zamaza, O., and Cuenca Grau, B. (2014) Results of the Ontology Alignment Evaluation Initiative 2014. Proc. 9th ISWC workshop on ontology matching (OM 2014).</p> +<p>[3] Bhattacharya, I. and Getoor, L. (2006) Entity resolution in graphs. Mining Graph Data. Wiley and Sons 2006.</p> +<p>[4] Noessner, J., Niepert, M., Meilicke, C., and Stuckenschmidt, H. (2010) Leveraging Terminological Structure for Object Reconciliation. In ESWC 2010.</p> +<p>[5] Flouris, G., Manakanatas, D., Kondylakis, H., Plexousakis, D., Antoniou, G. 
Ontology Change: Classification and Survey (2008) Knowledge Engineering Review (KER 2008), pages 117-152.</p> +<p>[6] Ferrara, A., Lorusso, D., Montanelli, S., and Varese, G. (2008) Towards a Benchmark for Instance Matching. Proc. 3th ISWC workshop on ontology matching (OM 2008).</p> +<p>[7] Ferrara, A., Montanelli, S., Noessner, J., and Stuckenschmidt, H. (2011) Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p> + + + + + SNB Interactive Part 3: Choke Points and Initial Run on Virtuoso + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + Wed, 10 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + <p>In this post we will look at running the <a href="https://ldbcouncil.org/developer/snb">LDBC SNB</a> on <a href="https://virtuoso.openlinksw.com/">Virtuoso</a>.</p> +<p>First, let&rsquo;s recap what the benchmark is about:</p> +<ol> +<li> +<p>fairly frequent short updates, with no update contention worth mentioning</p> +</li> +<li> +<p>short random lookups</p> +</li> +<li> +<p>medium complex queries centered around a person&rsquo;s social environment</p> +</li> +</ol> +<p>The updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an online social application does lookups for the most part. The medium complex queries are to challenge the DBMS.</p> +<p>The DBMS challenges have to do firstly with query optimization, and secondly with execution with a lot of non-local random access patterns. Query optimization is not a requirement, <em>per se,</em> since imperative implementations are allowed, but we will see that these are no more free of the laws of nature than the declarative ones.</p> +<p>The workload is arbitrarily parallel, so intra-query parallelization is not particularly useful, if also not harmful. There are latency constraints on operations which strongly encourage implementations to stay within a predictable time envelope regardless of specific query parameters. The parameters are a combination of person and date range, and sometimes tags or countries. The hardest queries have the potential to access all content created by people within 2 steps of a central person, so possibly thousands of people, times 2000 posts per person, times up to 4 tags per post. We are talking in the millions of key lookups, aiming for sub-second single-threaded execution.</p> +<p>The test system is the same as used in the <a href="http://www.openlinksw.com/weblog/oerling/?id=1739">TPC-H series</a>: dual Xeon E5-2630, 2x6 cores x 2 threads, 2.3GHz, 192 GB RAM. The software is the <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics branch</a> of <a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack, available from www.github.com</a>.</p> +<p>The dataset is the SNB 300G set, with:</p> +<table> +<thead> +<tr> +<th>1,136,127</th> +<th>persons</th> +</tr> +</thead> +<tbody> +<tr> +<td>125,249,604</td> +<td>knows edges</td> +</tr> +<tr> +<td>847,886,644</td> +<td>posts, including replies</td> +</tr> +<tr> +<td>1,145,893,841</td> +<td>tags of posts or replies</td> +</tr> +<tr> +<td>1,140,226,235</td> +<td>likes of posts or replies</td> +</tr> +</tbody> +</table> +<p>As an initial step, we run the benchmark as fast as it will go. 
We use 32 threads on the driver side for 24 hardware threads.</p> +<p>Below are the numerical quantities for a 400K operation run after 150K operations worth of warmup.</p> +<p><strong>Duration:</strong> 10:41.251<br> +<strong>Throughput:</strong> 623.71 (op/s)</p> +<p>The statistics that matter are detailed below, with operations ranked in order of descending client-side wait-time. All times are in milliseconds.</p> +<table> +<thead> +<tr> +<th>% of total</th> +<th>total_wait</th> +<th>name</th> +<th>count</th> +<th>mean</th> +<th>min</th> +<th>max</th> +</tr> +</thead> +<tbody> +<tr> +<td>20%</td> +<td>4,231,130</td> +<td>LdbcQuery5</td> +<td>656</td> +<td>6,449.89</td> +<td>245</td> +<td>10,311</td> +</tr> +<tr> +<td>11%</td> +<td>2,272,954</td> +<td>LdbcQuery8</td> +<td>18,354</td> +<td>123.84</td> +<td>14</td> +<td>2,240</td> +</tr> +<tr> +<td>10%</td> +<td>2,200,718</td> +<td>LdbcQuery3</td> +<td>388</td> +<td>5,671.95</td> +<td>468</td> +<td>17,368</td> +</tr> +<tr> +<td>7.3%</td> +<td>1,561,382</td> +<td>LdbcQuery14</td> +<td>1,124</td> +<td>1,389.13</td> +<td>4</td> +<td>5,724</td> +</tr> +<tr> +<td>6.7%</td> +<td>1,441,575</td> +<td>LdbcQuery12</td> +<td>1,252</td> +<td>1,151.42</td> +<td>15</td> +<td>3,273</td> +</tr> +<tr> +<td>6.5%</td> +<td>1,396,932</td> +<td>LdbcQuery10</td> +<td>1,252</td> +<td>1,115.76</td> +<td>13</td> +<td>4,743</td> +</tr> +<tr> +<td>5%</td> +<td>1,064,457</td> +<td>LdbcShortQuery3PersonFriends</td> +<td>46,285</td> +<td>22.9979</td> +<td>0</td> +<td>2,287</td> +</tr> +<tr> +<td>4.9%</td> +<td>1,047,536</td> +<td>LdbcShortQuery2PersonPosts</td> +<td>46,285</td> +<td>22.6323</td> +<td>0</td> +<td>2,156</td> +</tr> +<tr> +<td>4.1%</td> +<td>885,102</td> +<td>LdbcQuery6</td> +<td>1,721</td> +<td>514.295</td> +<td>8</td> +<td>5,227</td> +</tr> +<tr> +<td>3.3%</td> +<td>707,901</td> +<td>LdbcQuery1</td> +<td>2,117</td> +<td>334.389</td> +<td>28</td> +<td>3,467</td> +</tr> +<tr> +<td>2.4%</td> +<td>521,738</td> +<td>LdbcQuery4</td> +<td>1,530</td> +<td>341.005</td> +<td>49</td> +<td>2,774</td> +</tr> +<tr> +<td>2.1%</td> +<td>440,197</td> +<td>LdbcShortQuery4MessageContent</td> +<td>46,302</td> +<td>9.50708</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.9%</td> +<td>407,450</td> +<td>LdbcUpdate5AddForumMembership</td> +<td>14,338</td> +<td>28.4175</td> +<td>0</td> +<td>2,008</td> +</tr> +<tr> +<td>1.9%</td> +<td>405,243</td> +<td>LdbcShortQuery7MessageReplies</td> +<td>46,302</td> +<td>8.75217</td> +<td>0</td> +<td>2,112</td> +</tr> +<tr> +<td>1.9%</td> +<td>404,002</td> +<td>LdbcShortQuery6MessageForum</td> +<td>46,302</td> +<td>8.72537</td> +<td>0</td> +<td>1,968</td> +</tr> +<tr> +<td>1.8%</td> +<td>387,044</td> +<td>LdbcUpdate3AddCommentLike</td> +<td>12,659</td> +<td>30.5746</td> +<td>0</td> +<td>2,060</td> +</tr> +<tr> +<td>1.7%</td> +<td>361,290</td> +<td>LdbcShortQuery1PersonProfile</td> +<td>46,285</td> +<td>7.80577</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.6%</td> +<td>334,409</td> +<td>LdbcShortQuery5MessageCreator</td> +<td>46,302</td> +<td>7.22234</td> +<td>0</td> +<td>2,055</td> +</tr> +<tr> +<td>1%</td> +<td>220,740</td> +<td>LdbcQuery2</td> +<td>1,488</td> +<td>148.347</td> +<td>2</td> +<td>2,504</td> +</tr> +<tr> +<td>0.96%</td> +<td>205,910</td> +<td>LdbcQuery7</td> +<td>1,721</td> +<td>119.646</td> +<td>11</td> +<td>2,295</td> +</tr> +<tr> +<td>0.93%</td> +<td>198,971</td> +<td>LdbcUpdate2AddPostLike</td> +<td>5,974</td> +<td>33.3062</td> +<td>0</td> +<td>1,987</td> +</tr> +<tr> +<td>0.88%</td> +<td>189,871</td> 
+<td>LdbcQuery11</td> +<td>2,294</td> +<td>82.7685</td> +<td>4</td> +<td>2,219</td> +</tr> +<tr> +<td>0.85%</td> +<td>182,964</td> +<td>LdbcQuery13</td> +<td>2,898</td> +<td>63.1346</td> +<td>1</td> +<td>2,201</td> +</tr> +<tr> +<td>0.74%</td> +<td>158,188</td> +<td>LdbcQuery9</td> +<td>78</td> +<td>2,028.05</td> +<td>1,108</td> +<td>4,183</td> +</tr> +<tr> +<td>0.67%</td> +<td>143,457</td> +<td>LdbcUpdate7AddComment</td> +<td>3,986</td> +<td>35.9902</td> +<td>1</td> +<td>1,912</td> +</tr> +<tr> +<td>0.26%</td> +<td>54,947</td> +<td>LdbcUpdate8AddFriendship</td> +<td>571</td> +<td>96.2294</td> +<td>1</td> +<td>988</td> +</tr> +<tr> +<td>0.2%</td> +<td>43,451</td> +<td>LdbcUpdate6AddPost</td> +<td>1,386</td> +<td>31.3499</td> +<td>1</td> +<td>2,060</td> +</tr> +<tr> +<td>0.01%</td> +<td>1,848</td> +<td>LdbcUpdate4AddForum</td> +<td>103</td> +<td>17.9417</td> +<td>1</td> +<td>65</td> +</tr> +<tr> +<td>0.00%</td> +<td>44</td> +<td>LdbcUpdate1AddPerson</td> +<td>2</td> +<td>22</td> +<td>10</td> +<td>34</td> +</tr> +</tbody> +</table> +<p>At this point we have in-depth knowledge of the choke points the benchmark stresses, and we can give a first assessment of whether the design meets its objectives for setting an agenda for the coming years of graph database development.</p> +<p>The implementation is well optimized in general but still has maybe 30% room for improvement. We note that this is based on a compressed column store. One could think that alternative data representations, like in-memory graphs of structs and pointers between them, are better for the task. This is not necessarily so; at the least, a compressed column store is much more space efficient. Space efficiency is the root of cost efficiency, since as soon as the working set is not in memory, a random access workload is badly hit.</p> +<p>The set of choke points (technical challenges) actually revealed by the benchmark is so far as follows:</p> +<ul> +<li> +<p><em>Cardinality estimation under heavy data skew —</em> Many queries take a tag or a country as a parameter. The cardinalities associated with tags vary from 29M posts for the most common to 1 for the least common. Q6 has a common tag (in top few hundred) half the time and a random, most often very infrequent, one the rest of the time. A declarative implementation must recognize the cardinality implications from the literal and plan accordingly. An imperative one would have to count. Missing this makes Q6 take about 40% of the time instead of 4.1% when adapting.</p> +</li> +<li> +<p><em>Covering indices —</em> Being able to make multi-column indices that duplicate some columns from the table often saves an entire table lookup. For example, an index onpost by author can also contain the post&rsquo;s creation date.</p> +</li> +<li> +<p><em>Multi-hop graph traversal —</em> Most queries access a two-hop environment starting at a person. Two queries look for shortest paths of unbounded length. For the two-hop case, it makes almost no difference whether this is done as a union or a special graph traversal operator. For shortest paths, this simply must be built into the engine; doing this client-side incurs prohibitive overheads. A bidirectional shortest path operation is a requirement for the benchmark.</p> +</li> +<li> +<p><em>Top <em>K</em> —</em> Most queries returning posts order results by descending date. Once there are at least <em>k</em> results, anything older than the __k__th can be dropped, adding a dateselection as early as possible in the query. 
This interacts with vectored execution, so that starting with a short vector size more rapidly produces an initial top <em>k</em>.</p> +</li> +<li> +<p><em>Late projection —</em> Many queries access several columns and touch millions of rows but only return a few. The columns that are not used in sorting or selection can be retrieved only for the rows that are actually returned. This is especially useful with a column store, as this removes many large columns (e.g., text of a post) from the working set.</p> +</li> +<li> +<p><em>Materialization —</em> Q14 accesses an expensive-to-compute edge weight, the number of post-reply pairs between two people. Keeping this precomputed drops Q14 from the top place. Other materialization would be possible, for example Q2 (top 20 posts by friends), but since Q2 is just 1% of the load, there is no need. One could of course argue that this should be 20x more frequent, in which case there could be a point to this.</p> +</li> +<li> +<p><em>Concurrency control —</em> Read-write contention is rare, as updates are randomly spread over the database. However, some pages get read very frequently, e.g., some middle level index pages in the post table. Keeping a count of reading threads requires a mutex, and there is significant contention on this. Since the hot set can be one page, adding more mutexes does not always help. However, hash partitioning the index into many independent trees (as in the case of a cluster) helps for this. There is also contention on a mutex for assigning threads to client requests, as there are large numbers of short operations.</p> +</li> +</ul> +<p>In subsequent posts, we will look at specific queries, what they in fact do, and what their theoretical performance limits would be. In this way we will have a precise understanding of which way SNB can steer the graph DB community.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + SNB and Graphs Related Presentations at GRADES '15 + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + Fri, 29 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + <p>Next 31st of May the GRADES workshop will take place in Melbourne within the ACM/SIGMOD presentation. GRADES started as an initiative of the Linked Data Benchmark Council in the SIGMOD/PODS 2013 held in New York.</p> +<p>Among the papers published in this edition we have &ldquo;Graphalytics: A Big Data Benchmark for Graph-Processing Platforms&rdquo;, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can be found in <a href="https://github.com/ldbc">https://github.com/ldbc</a>) as the base to execute the algorithms used for the benchmark, among which we have BFS, community detection and connected components. We also have &ldquo;Microblogging Queries on Graph Databases: an Introspection&rdquo; which benchmarks two of the most significant Graph Databases in the market, i.e. 
Neo4j and Sparksee using microblogging queries on top of twitter data. We can finally mention &ldquo;Frappé: Querying the Linux Kernel Dependency Graph&rdquo; which presents a framework for querying and visualising the dependencies of large C/C++ software systems.</p> +<p><a href="http://event.cwi.nl/grades2015/program.shtml">Check the complete agenda.</a></p> +<p>Meet you in Melbourne!</p> + + + + + SNB Interactive Part 2: Modeling Choices + https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/ + Tue, 26 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/ + <p><a href="https://ldbcouncil.org/benchmarks/snb">​SNB Interactive</a> is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.</p> +<p>In the case of <a href="http://dbpedia.org/resource/Virtuoso_Universal_Server">Virtuoso</a>, we have played with <a href="http://dbpedia.org/resource/SQL">SQL</a> and <a href="http://dbpedia.org/resource/SPARQL">SPARQL</a> implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that this allows to materialize multi-part indices and data orderings that make sense for the application. In other words, there is transparency into physical design. An RDF application may also have physical design by means ofstructure-aware storage but this is more complex and here we are just concerned with speed and having things work precisely as we intend.</p> +<h3 id="schema-design">Schema Design</h3> +<p>SNB has a regular schema described by a <a href="https://en.wikipedia.org/wiki/Unified_Modeling_Language">UML</a> diagram. This has a number of relationships of which some have attributes. There are no heterogenous sets, e.g. no need for run-time typed attributes or graph edges with the same label but heterogeneous end points. Translation into SQL or RDF is straightforward. Edges with attributes, e.g. the knows relation between people would end up represented as a subject with the end points and the date since as properties. The relational implementation has a two-part primary key and the date since as a dependent column. A native property graph database would use an edge with an extra property for this, as such are typically supported.</p> +<p>The only table-level choice has to do with whether <code>posts</code> and <code>comments</code> are kept in the same or different data structures. The Virtuoso schema has a single table for both, with nullable columns for the properties that occur only in one. This makes the queries more concise. There are cases where only non-reply posts of a given author are accessed. This is supported by having two author foreign key columns each with its own index. There is a single nullable foreign key from the reply to the post/comment being replied to.</p> +<p>The workload has some frequent access paths that need to be supported by index. Some queries reward placing extra columns in indices. For example, a common pattern is accessing the most recent posts of an author or group of authors. 
There, having a composite key of <code>ps_creatorid</code>, <code>ps_creationdate</code>, <code>ps_postid</code> pays off, since the top-k on <code>creationdate</code> can be pushed down into the index without needing a reference to the table.</p>
+<p>The implementation is free to choose data types for attributes, specifically datetimes. The Virtuoso implementation adopts the practice of the <a href="http://dbpedia.org/resource/DEX_(Graph_database)">Sparksee</a> and <a href="http://dbpedia.org/resource/Neo4j">Neo4j</a> implementations and represents this as a count of milliseconds since the epoch. This is less confusing, faster to compare and more compact than a native datetime datatype that may or may not have timezones etc. Using a built-in datetime seems to be nearly always a bad idea. A dimension table or a number for a time dimension avoids the ambiguities of a calendar or at least makes these explicit.</p>
+<p>The benchmark allows procedurally maintaining materializations of intermediate results for use by queries, as long as these are maintained transaction by transaction. For example, each person could have the 20 newest posts by immediate contacts precomputed. This would reduce Q2 &ldquo;top of the wall&rdquo; to a single lookup. This does not, however, appear to be worthwhile. The Virtuoso implementation does do one such materialization for Q14: a connection weight is calculated for every pair of persons that know each other. This is related to the count of replies by either one to content generated by the other. If there does not exist a single reply in either direction, the weight is taken to be 0. This weight is precomputed after bulk load and subsequently maintained each time a reply is added. The table for this is the only row-wise structure in the schema and represents a half matrix of connected people, i.e. <code>person1</code>, <code>person2</code> -&gt; <code>weight</code>. <code>Person1</code> is by convention the one with the smaller <code>p_personid</code>. Note that comparing IDs in this way is useful but not normally supported by RDF systems. RDF would end up comparing strings of URIs, with disastrous performance implications, unless an implementation-specific trick were used.</p>
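+<p>As a rough illustration of this materialization, the sketch below shows the kind of bookkeeping involved: a symmetric weight per pair of acquainted persons, incremented on every reply. The class and method names are hypothetical, and in Virtuoso this is of course maintained inside the server rather than in application code.</p>
+<pre><code>import java.util.HashMap;
+import java.util.Map;
+
+// Hypothetical sketch of the Q14 connection-weight materialization.
+final class ConnectionWeights {
+    private final Map&lt;String, Long&gt; weights = new HashMap&lt;&gt;();
+
+    // by convention the smaller person id comes first in the key
+    private static String key(long personA, long personB) {
+        long lo = Math.min(personA, personB);
+        long hi = Math.max(personA, personB);
+        return lo + "_" + hi;
+    }
+
+    // called for every new reply by 'author' to content created by 'originalAuthor'
+    void onReply(long author, long originalAuthor) {
+        weights.merge(key(author, originalAuthor), 1L, Long::sum);
+    }
+
+    // 0 if there has never been a reply in either direction
+    long weight(long personA, long personB) {
+        return weights.getOrDefault(key(personA, personB), 0L);
+    }
+}
+</code></pre>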
+<p>In the next installment we will analyze an actual run.</p>
+<h3 id="snb-interactive-series">SNB Interactive Series</h3>
+<ul>
+<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li>
+<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li>
+<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li>
+</ul>
+
+
+
+
+ LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference
+ https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/
+ Mon, 25 May 2015 00:00:00 +0000
+
+ https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/
+ <p>LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015. The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.</p>
+<p>On the industry track, LDBC will be presenting the <em>Social Network Benchmark Interactive Workload</em> by Orri Erling (OpenLink Software), Alex Averbuch (Neo Technology), Josep Larriba-Pey (Sparsity Technologies), Hassan Chafi (Oracle Labs), Andrey Gubichev (TU Munich), Arnau Prat (Universitat Politècnica de Catalunya), Minh-Duc Pham (VU University Amsterdam) and Peter Boncz (CWI).</p>
+<p>You can read more about the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark here</a> and collaborate if you&rsquo;re interested!</p>
+<p>The other presentation will be at the GRADES workshop within the SIGMOD program, regarding <em>Graphalytics: A Big Data Benchmark for Graph-Processing platforms</em> by Mihai Capotă, Tim Hegeman, Alexandru Iosup (Delft University of Technology), Arnau Prat (Universitat Politècnica de Catalunya), Orri Erling (OpenLink Software) and Peter Boncz (CWI). We will provide more information about GRADES and this specific presentation in a follow-up post, as GRADES is part of the events organized by LDBC.</p>
+<p>Don&rsquo;t forget to check our presentations if you&rsquo;re attending SIGMOD!</p>
+
+
+
+
+ SNB Interactive Part 1: What Is SNB Interactive Really About?
+ https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/
+ Thu, 14 May 2015 00:00:00 +0000
+
+ https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/
+ <p>This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. It is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of the same.</p>
+<p>With two implementations of SNB Interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its performance characteristics are understood; even if these do not represent the maximum of the attainable, there are no glaring mistakes, and the implementation represents a reasonable best effort by those who ought to know, namely the system vendors.</p>
+<p>The essence of a benchmark is a set of trick questions or choke points, as LDBC calls them. A number of these were planned from the start. It is then the role of experience to tell whether addressing these is really the key to winning the race. Unforeseen ones will also surface.</p>
+<p>So far, we see that SNB confronts the implementor with choices in the following areas:</p>
+<ul>
+<li>Data model: Relational, RDF, property graph?</li>
+<li>Physical model, e.g. row-wise vs. column-wise storage</li>
+<li>Materialized data ordering: Sorted projections, composite keys, replicating columns in auxiliary data structures</li>
+<li>Maintaining precomputed, materialized intermediate results, e.g. use of materialized views, triggers</li>
+<li>Query optimization: join order/type, interesting physical data orderings, late projection, top k, etc.</li>
+<li>Parameters vs. literals: Sometimes different parameter values result in different optimal query plans</li>
+<li>Predictable, uniform latency: The measurement rules stipulate that the SUT must not fall behind the simulated workload</li>
+<li>Durability: How to make data durable while maintaining steady throughput? Logging vs. checkpointing.</li>
+</ul>
+<p>In the process of making a benchmark implementation, one naturally encounters questions about the validity, reasonableness and rationale of the benchmark definition itself. Additionally, even though the benchmark might not directly measure certain aspects of a system, making an implementation will take a system past its usual envelope and highlight some operational aspects.</p>
+<ul>
+<li>Data generation: Generating a mid-size dataset takes time, e.g. 8 hours for 300G. In a cloud situation, keeping the dataset in S3 or similar is necessary; re-generating it every time is not an option.</li>
+<li>Query mix: Are the relative frequencies of the operations reasonable? What bias does this introduce?</li>
+<li>Uniformity of parameters: Due to non-uniform data distributions in the dataset, there is easily a 100x difference between a &lsquo;fast&rsquo; and a &lsquo;slow&rsquo; case of a single query template. How long does one need to run to balance out these fluctuations?</li>
+<li>Working set: Experience shows that there is a large difference between an almost-warm working set and a steady state. This can be a factor of 1.5 in throughput.</li>
+<li>Are the latency constraints reasonable? In the present case, a qualifying run must have under 5% of all query executions starting over 1 second late. Each execution is scheduled beforehand and done at the intended time. If the SUT does not keep up, it will have all available threads busy and must finish some work before accepting new work, so some queries will start late. Is this a good criterion for measuring consistency of response time? There are some obvious possibilities of abuse.</li>
+<li>Is the benchmark easy to implement/run? Perfection is open-ended and the optimization possibilities are infinite, albeit with diminishing returns. Still, getting started should not be too hard. Since systems will be highly diverse, testing that these in fact do the same thing is important. The SNB validation suite is good for this, and given publicly available reference implementations, the effort of getting started is not unreasonable.</li>
+<li>Since a qualifying run must meet latency constraints while going as fast as possible, setting the performance target involves trial and error. Does the tooling make this easy?</li>
+<li>Is the durability rule reasonable? Right now, one is not required to do checkpoints but must report the time to roll forward from the last checkpoint or initial state. Incenting vendors to build faster recovery is certainly good, but we are not through with all the implications.
What about redundant clusters?</li> +</ul> +<p>The following posts will look at the above in light of actual experience.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + Why Do We Need an LDBC SNB-Specific Workload Driver? + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + Tue, 21 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + <p>In a previous <a href="https://ldbcouncil.org/tags/driver">3-part blog series</a> we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn&rsquo;t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more traditional database benchmark workloads. Additionally, it will motivate why we chose to develop a new workload driver as part of this work, rather than using existing tooling that was developed in other database benchmarking efforts. To briefly recap, the task of the driver is to run a transactional database benchmark against large synthetic graph datasets - &ldquo;graph&rdquo; is the word that best captures the novelty and difficulty of this work.</p> +<p><strong>Workload Execution - Traditional vs Graph</strong></p> +<p>Transactional graph workloads differ from traditional relational workloads in several fundamental ways, one of them being the complex dependencies that exist between queries of a graph workload.</p> +<p>To understand what is meant by &ldquo;traditional relational workloads&rdquo;, take the classical TPC-C benchmark as an example. In TPC-C Remote Terminal Emulators (emulators) are used to issue update transactions in parallel, where the transactions issued by these emulators do not depend on one another. Note, &ldquo;dependency&rdquo; is used here in the context of scheduling, i.e., one query is dependent on another if it can not start until the other completes. For example, a New-Order transaction does not depend on other orders from this or other users. Naturally, the results of Stock-Level transactions depend on the items that were previously sold, but in TPC-C it is not an emulator&rsquo;s responsibility to enforce any such ordering. The scheduling strategy employed by TPC-C is tailored to the scenario where transactional updates do not depend on one another. In reality, one would expect to also have scheduling dependencies between transactions, e.g., checking the status of the order should only be done after the order is registered in the system. TPC-C, however, does not do this and instead only asks for the status of the last order <em>for a given user</em>. Furthermore, adding such dependencies to TPC-C would make scheduling only slightly more elaborate. 
Indeed, the Load Tester (LT) would need to make sure a New-Order transaction always precedes the read requests that check its status, but because users (and their orders) are partitioned across LTs, and orders belong to a particular user, this scheduling does not require inter-LT communication.</p>
+<p>A significantly more difficult scheduling problem arises when we consider the SNB benchmark, which models a real-world social network. Its domain includes users that form a social friendship graph and who leave posts/comments/likes on each other&rsquo;s walls (forums). The update transactions are generated (exported as a log) by the data generator, with assigned timestamps, e.g. user 123 added post 456 to forum 789 at time T. Suppose we partition this workload by user, such that each driver gets all the updates (friendship requests, posts, comments and likes on other users&rsquo; posts, etc.) initiated by a given user. Now, if the benchmark is to resemble a real-world social network, the update operations represent a highly connected (and dependent) network: a user should not create comments before she joins the network, a friendship request cannot be sent to a non-existent user, a comment can only be added to a post that already exists, etc. Given a user partitioning scheme, most such dependencies would cross the boundaries between driver threads/processes, because the correct execution of update operations requires that the social network is in a particular state, and that state depends on the progress of other threads/processes.</p>
+<p>Such scheduling dependencies in the SNB workload essentially replicate the underlying graph-like shape of its dataset. That is, every time a user comments on a friend&rsquo;s wall, for example, there is a dependency between two operations that is captured by an edge of the social graph. <em>Partitioning the workload among the LTs therefore becomes equivalent to graph partitioning, a known hard problem.</em></p>
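+<p>To make this concrete, the following is a minimal sketch of the kind of bookkeeping a driver has to do before it may submit a dependent update: an operation that creates an entity reports its completion, and an operation that depends on other entities is only released once all of them exist. The class and method names here are purely illustrative and are not the actual LDBC driver API.</p>
+<pre><code>import java.util.Map;
+import java.util.concurrent.ConcurrentHashMap;
+
+// Illustrative sketch only: gating dependent updates on the entities they need.
+final class DependencyTracker {
+    // entity id (person, post, comment, ...) -&gt; time at which its creating update completed
+    private final Map&lt;Long, Long&gt; completed = new ConcurrentHashMap&lt;&gt;();
+
+    // called when an update that creates an entity has finished executing
+    void markCompleted(long entityId, long completionTime) {
+        completed.put(entityId, completionTime);
+    }
+
+    // e.g. a comment may only be submitted once its author and its parent post exist
+    boolean canExecute(long... dependsOnEntityIds) {
+        for (long id : dependsOnEntityIds) {
+            if (!completed.containsKey(id)) {
+                return false;
+            }
+        }
+        return true;
+    }
+}
+</code></pre>
+<p>When the workload is spread over parallel or distributed LTs, this completion information itself has to be shared between them, which is exactly the coordination cost that the graph-shaped dependencies impose.</p>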
+<p><strong>Because it&rsquo;s a graph</strong></p>
+<p>In short, unlike previous database benchmarking efforts, the SNB workload has necessitated redefining the state of the art in workload execution. It is no longer sufficient to rely solely on workload partitioning to safely capture inter-query dependencies in complex database benchmark workloads. The graph-centric nature of SNB introduces new challenges, and novel mechanisms had to be developed to overcome them. To the best of our knowledge, the LDBC SNB Interactive benchmark is the first benchmark that requires a non-trivial partitioning of the workload among the benchmark drivers. In the context of workload execution, our contribution is therefore the principled design of a driver that executes dependent update operations in a performant and scalable way, across parallel/distributed LTs, while providing repeatable, vendor-independent execution of the benchmark.</p>
+
+
+
+
+ Event Driven Post Generation in Datagen
+ https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/
+ Fri, 10 Apr 2015 00:00:00 +0000
+
+ https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/
+ <p>As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain in more depth how this is actually implemented inside the generator.</p>
+<p>First of all, I start with a few basics of how Datagen works internally. In Datagen, once the person graph has been created (persons and their relationships), the activity generation starts. Persons are divided into blocks of 10k, in the same way as during the friendship edge generation process. Then, for each person of the block, three types of forums are created:</p>
+<ul>
+<li>
+<p>The wall of the person</p>
+</li>
+<li>
+<p>The albums of the person</p>
+</li>
+<li>
+<p>The groups where the person is a moderator</p>
+</li>
+</ul>
+<p>We will focus on group generation, but the same concepts apply to the other types of forums. Once a group is created, the members of the group are selected. These are selected from either the friends of the moderator, or random persons within the same block.</p>
+<p>After assigning the members to the group, the post generation starts. We have two types of post generators, the uniform post generator and the event-based post generator. Each post generator is responsible for generating, given a forum, a set of posts for that forum, whose authors are taken from the set of members of the forum. The uniform post generator distributes the dates of the generated posts uniformly in the time line (from the date of the membership until the end of the simulation time). On the other hand, the event-based post generator assigns dates to posts based on what we call &ldquo;flashmob events&rdquo;.</p>
+<p>Flashmob events are generated at the beginning of the execution. Their number is predefined by a configuration parameter, which is set to 30 events per month of simulation, and the time of each event is distributed uniformly along the time line. Also, each event has a volume level assigned (between 1 and 20) following a power-law distribution, which determines how relevant or important the event is, and a tag representing the concept or topic of the event. Two different events can have the same tag. For example, one of the flashmob events created for SF1 is related to the &ldquo;Enrique Iglesias&rdquo; tag, has level 11 and occurs on the 29th of May 2012 at 09:33:47.</p>
+<p>Once the event-based post generation starts for a given group, a subset of the generated flashmob events is extracted. These events must be correlated with the tag/topic of the group, and the set of selected events is restricted by the creation date of the group (in a group, one cannot talk about an event prior to the creation of the group). Given this subset of events and their volume levels, a cumulative probability distribution (over the events sorted by event date, weighted by level) is computed, which is later used to determine which event a given post is associated with. Therefore, events with a larger level will have a larger probability of receiving posts, making their volume larger. Then, post generation starts, which can be summarized as follows:</p>
+<ul>
+<li>
+<p>Determine the number of posts to generate</p>
+</li>
+<li>
+<p>Select a random member of the group that will generate the post</p>
+</li>
+<li>
+<p>Determine the event the post will be related to, given the aforementioned cumulative distribution (see the sketch below)</p>
+</li>
+<li>
+<p>Assign the date of the post based on the event date</p>
+</li>
+</ul>
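+<p>As a rough illustration of the third step, the sketch below shows one way such a selection from a cumulative distribution can be implemented. The class is hypothetical and simplified with respect to Datagen&rsquo;s actual code, but the idea is the same: events with a larger volume level occupy a larger share of the [0, 1) interval and therefore attract more posts.</p>
+<pre><code>import java.util.Map;
+import java.util.Random;
+import java.util.TreeMap;
+
+// Hypothetical, simplified sketch of flashmob event selection.
+final class FlashmobEventSelector {
+    // cumulative probability -&gt; event date (events kept sorted by date)
+    private final TreeMap&lt;Double, Long&gt; cumulative = new TreeMap&lt;&gt;();
+    private final Random random = new Random();
+
+    FlashmobEventSelector(long[] eventDates, int[] eventLevels) {
+        double total = 0.0;
+        for (int level : eventLevels) {
+            total += level;
+        }
+        double running = 0.0;
+        for (int i = 0; i &lt; eventDates.length; i++) {
+            running += eventLevels[i] / total;  // a higher level means a wider slice
+            cumulative.put(running, eventDates[i]);
+        }
+    }
+
+    // returns the date of the event the next post will be attached to
+    long nextEventDate() {
+        Map.Entry&lt;Double, Long&gt; entry = cumulative.ceilingEntry(random.nextDouble());
+        return (entry != null ? entry : cumulative.lastEntry()).getValue();
+    }
+}
+</code></pre>
+<p>With the event chosen, the date of the post itself still has to be drawn around the event date, as described next.</p>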
+<p>In order to assign the date to the post, based on the date of the event the post is assigned to, we follow a probability density which has been extracted from <a href="#references">[1]</a>. The shape of the probability density combines an exponential function in the 8-hour interval around the peak with a logarithmic function outside this interval. The following figure shows the actual shape of the volume, centered at the date of the event.</p>
+<p><img src="index.png" alt=""></p>
+<p>Following the example of &ldquo;Enrique Iglesias&rdquo;, the following figure shows the activity volume of posts around the event as generated by Datagen.</p>
+<p><img src="index2.png" alt=""></p>
+<p>In this blog entry we have seen how Datagen creates event-driven user activity. This allows us to reproduce the heterogeneous post creation density found in a real social network, where post creation is driven by real-world events.</p>
+<h4 id="references">References</h4>
+<p>[1] Jure Leskovec, Lars Backstrom, Jon M. Kleinberg: Meme-tracking and the dynamics of the news cycle. KDD 2009: 497-506</p>
+
+
+
+
+ Sixth TUC Meeting
+ https://ldbcouncil.org/event/sixth-tuc-meeting/
+ Thu, 19 Mar 2015 13:53:33 -0400
+
+ https://ldbcouncil.org/event/sixth-tuc-meeting/
+ <p>The LDBC consortium is pleased to announce its Sixth Technical User Community (TUC) meeting.</p>
+<p>This will be a two-day event at Universitat Politècnica de Catalunya, Barcelona, on <strong>Thursday and Friday March 19/20, 2015.</strong></p>
+<p>The LDBC FP7 EC funded project is reaching its finalisation, and this will be the last event sponsored directly by the project. However, tasks within LDBC will continue based on the independent LDBC organisation. The event will cover the following aspects:</p>
+<ul>
+<li>A two-day event, with one day devoted to users&rsquo; experiences and one day devoted to benchmarking experiences.</li>
+<li>Presentation of the first benchmarking results for the different benchmarks.</li>
+<li>Interaction with the new LDBC Board of Directors and the new LDBC organisation officials.</li>
+<li>A pre-event with the 3rd Graph-TA workshop, organised on March 18th at the same premises, with a lot of interaction and interesting research presentations.</li>
+</ul>
+<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>.</p>
+<h3 id="agenda">Agenda</h3>
+<p><strong>Thursday 19th March</strong></p>
+<p>11:00 - 11:30 Registration, coffee break and welcome (Josep Larriba Pey)</p>
+<p>11:30 - 12:00 LDBC introduction and status update (Peter Boncz) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981131.pdf">slides</a></p>
+<p>12:00 - 13:30 Technology and benchmarking (chair: Peter Boncz)</p>
+<p>12:00 Venelin Kotsev (Ontotext). Semantic Publishing Benchmark v2.0. – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981137.pdf">slides</a></p>
+<p>12:30 Nina Saveta (FORTH). SPIMBENCH: A Scalable, Schema-Aware, Instance Matching Benchmark for the Semantic Publishing Domain</p>
+<p>12:50 Tomer Sagi (HP).
Titan DB on LDBC SNB Interactive</p> +<p>13:10 Claudio Martella (VUA): Giraph and Lighthouse</p> +<p>13:30 - 14:30 Lunch break</p> +<p>14:30 - 16:00 Applications and use of Graph Technologies (chair: Hassan Chafi)</p> +<p>14:30 Jerven Bolleman (Swiss Institute of Bioinformatics): 20 billion triples in production <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981132.pdf">slides</a></p> +<p>14:50 Mark Wilkinson (Universidad Politécnica de Madrid): Design principles for Linked-Data-native Semantic Web Services <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981133.pdf">slides</a></p> +<p>15:10 Peter Haase (Metaphacts, Systap LLC): Querying the Wikidata Knowledge Graph <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981139.pdf">slides</a></p> +<p>15:30 Esteban Sota (GNOSS): Human Interaction with Faceted Searching Systems for big or complex graphs</p> +<p>18:30 - 20:00 Cultural visit Barcelona city center. Meet at Plaça Catalunya.</p> +<p>20:00 Social dinner at <a href="http://www.bastaix.com">Bastaix Restaurant</a>.</p> +<p><strong>Friday 20th March</strong></p> +<p>9:30 - 11:00 Technology and Benchmarking (chair: Josep L. Larriba-Pey)</p> +<p>9:30 Yinglong Xia (IBM): Towards Temporal Graph Management and Analytics</p> +<p>9:50 Alexandru Iosup (TU Delft). Graphalytics: A big data benchmark for graph-processing platforms</p> +<p>10:10 John Snelson (MarkLogic): Introduction to MarkLogic</p> +<p>10:30 Arnau Prat (UPC-Sparsity Technologies) and Alex Averbuch (Neo): Social Network Benchmark, Interactive Workload</p> +<p>10:50 Moritz Kaufmann. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/moritz-kaufmann-ldbc-snb-benchmark-auditing-6th-ldbc-tuc.pdf">The auditing experience</a></p> +<p>11:15 - 11:45 Coffee break</p> +<p>11:45 - 12:45 Applications and use of Graph Technologies (chair: Atanas Kiryakov)</p> +<p>11:45 Boris Motik (Oxford University): Parallel and Incremental Materialisation of RDF/Datalog in RDFox</p> +<p>12:05 Andreas Both (Unister): E-Commerce and Graph-driven Applications: Experiences and Optimizations while moving to Linked Data</p> +<p>12:25 Smrati Gupta (CA Technologies). Modaclouds Decision Support System in multicloud environments</p> +<p>12:45 Peter Boncz. Conclusions for the LDBC project and future perspectives. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981138.pdf">slides</a></p> +<p>13:30 - 14:30 Lunch break</p> +<p>15:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>19th and 20th March 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held at &ldquo;Aula Master&rdquo; at A3 building located inside the &ldquo;Campus Nord UPC&rdquo; in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h5 id="maps-and-situation"><strong>Maps and situation</strong></h5> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<h5 id="finding-upc"><strong>Finding UPC</strong></h5> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<h5 id="finding-the-meeting-room"><strong>Finding the meeting room</strong></h5> +<h5 id="getting-there">Getting there</h5> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to<br> +the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €20 and trips to other destinations in the city cost approximately €25-30.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. 
You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p>
+<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p>
+<h5 id="the-locations-of-the-airport-and-the-city-centre"><strong>The locations of the airport and the city centre</strong></h5>
+
+
+
+
+      The LDBC Datagen Community Structure
+      https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/
+      Sun, 15 Mar 2015 00:00:00 +0000
+      
+      https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/
+      <p>This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.</p>
+<p>When generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other, more qualitative characteristics such as the degree distribution or the clustering coefficient. Real graphs, and especially social networks, typically have highly skewed degree distributions with a long tail, a moderately large clustering coefficient and an appreciable community structure.</p>
+<p>The first two characteristics are deliberately modeled in DATAGEN. DATAGEN generates persons with a degree distribution that matches that observed in Facebook, and thanks to the attribute correlated edge generation process, we obtain graphs with a moderately large clustering coefficient. But what about the community structure of graphs generated with DATAGEN? The answer can be found in the paper titled “How community-like is the structure of synthetically generated graphs”, which was published in GRADES 2014 <a href="#references">[1]</a>. Here we summarize the paper and its contributions and findings.</p>
+<p>Existing synthetic graph generators such as Rmat <a href="#references">[2]</a> and Mag <a href="#references">[3]</a> are graph generators designed to produce graphs with long-tailed distributions and a large clustering coefficient, but they completely ignore the fact that real graphs are structured into communities. For this reason, Lancichinetti et al. proposed LFR <a href="#references">[4]</a>, a graph generator that not only produces graphs with realistic high-level characteristics, but also enforces an appreciable community structure. This generator has become the de facto standard for benchmarking community detection algorithms, as it outputs not only a graph but also the communities present in that graph, hence it can be used to test the quality of a community detection algorithm.</p>
+<p>However, no one had studied whether the community structure produced by LFR is in fact realistic compared to real graphs. Even though the communities in LFR exhibit interesting properties, such as the expected larger internal density than external, or a long-tailed distribution of community sizes, they lack the noise and inhomogeneities present in a real graph. More importantly, how does the community structure of DATAGEN compare to that exhibited by LFR and by real graphs? Is it more or less realistic? The authors of <a href="#references">[1]</a> set up an experiment where they analyzed the characteristics of the communities output by LFR, and the groups (groups of people interested in a given topic) output by DATAGEN, and compared them to a set of real graphs with metadata. 
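</p>
+<p>The per-community indicators used in the comparison are listed further below. As a rough illustration (not part of the original study), such indicators can be computed with networkx along the following lines, assuming each community is given as a set of node ids and induces a connected subgraph:</p>
+<pre tabindex="0"><code>import networkx as nx
+
+def community_stats(G, members):
+    # G: the full undirected graph; members: node ids of one community
+    S = G.subgraph(members).copy()
+    tri = nx.triangles(S)  # triangles closed inside the community
+    tpr = sum(1 for v in S if tri[v] &gt; 0) / S.number_of_nodes()
+    bridges = sum(1 for _ in nx.bridges(S))  # edges whose removal disconnects S
+    # (clustering coefficient, TPR, bridge ratio, diameter, conductance, size)
+    return (nx.average_clustering(S), tpr,
+            bridges / max(S.number_of_edges(), 1),
+            nx.diameter(S), nx.conductance(G, set(members)),
+            S.number_of_nodes())
+</code></pre>
+<p>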
These real graphs, which can be downloaded from the Snap project website, are graphs that have recently become very popular in the field of community detection, as they contain ground truth communities extracted from their metadata. The ground truth graphs used in this experiment are shown in the following table. For more details about how this ground truth is generated, please refer to <a href="#references">[4]</a>.</p>
+<table>
+<thead>
+<tr>
+<th></th>
+<th><em>Nodes</em></th>
+<th><em>Edges</em></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><em>Amazon</em></td>
+<td>334863</td>
+<td>925872</td>
+</tr>
+<tr>
+<td><em>Dblp</em></td>
+<td>317080</td>
+<td>1049866</td>
+</tr>
+<tr>
+<td><em>Youtube</em></td>
+<td>1134890</td>
+<td>2987624</td>
+</tr>
+<tr>
+<td><em>Livejournal</em></td>
+<td>3997962</td>
+<td>34681189</td>
+</tr>
+</tbody>
+</table>
+<p>The authors of <a href="#references">[1]</a> selected a set of statistical indicators to characterize the communities:</p>
+<ul>
+<li>The clustering coefficient</li>
+<li>The triangle participation ratio (TPR), which is the ratio of nodes that close at least one triangle in the community.</li>
+<li>The bridge ratio, which is the ratio of edges whose removal disconnects the community.</li>
+<li>The diameter</li>
+<li>The conductance</li>
+<li>The size</li>
+</ul>
+<p>The authors start by analyzing each community of the ground truth graphs using the above statistical indicators and plotting the distributions of each of them. The following are the plots for the Livejournal graph. We summarize the findings of the authors regarding real graphs:</p>
+<ul>
+<li>
+<p>Several indicators (clustering coefficient, TPR and bridge ratio) exhibit a multimodal distribution, with two peaks at their extremes.</p>
+</li>
+<li>
+<p>Many of the communities (44%) have a small clustering coefficient, between 0 and 0.01. Out of them, 56% have just three vertices. On the other hand, 11% of the communities have a clustering coefficient between 0.99 and 1.0. In between, communities exhibit different values of the clustering coefficient. This trend is also observed for TPR and bridge ratio. This suggests that communities cannot be modeled using a single model.</p>
+</li>
+<li>
+<p>84% of the communities have a diameter smaller than five, suggesting that ground truth communities are small and compact.</p>
+</li>
+<li>
+<p>Ground truth communities are not very isolated; they have a lot of connections pointing outside of the community.</p>
+</li>
+<li>
+<p>Most of the communities are small (10 or fewer nodes).</p>
+</li>
+<li>
+<p>In general, ground truth communities are small, with a low diameter, not isolated, and with different ranges of internal connectivity.</p>
+</li>
+</ul>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index.png" alt=""></td>
+<td style="text-align:center"><img src="index2.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index3.png" alt=""></td>
+<td style="text-align:center"><img src="index4.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index5.png" alt=""></td>
+<td style="text-align:center"><img src="index6.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>The authors performed the same experiment for DATAGEN and LFR graphs. They generated graphs of 150k nodes, using their default parameters. In the case of LFR, they tested five different values of the mixing factor, which specifies the ratio of edges of a community pointing outside of the community; they ranged this value from 0 to 0.5. The following are the distributions for DATAGEN.</p>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index8.png" alt=""></td>
+<td style="text-align:center"><img src="index9.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index10.png" alt=""></td>
+<td style="text-align:center"><img src="index11.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index11.png" alt=""></td>
+<td style="text-align:center"><img src="index12.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>The main conclusions that can be extracted for DATAGEN can be summarized as follows:</p>
+<ul>
+<li>DATAGEN is able to reproduce the multimodal distribution observed for clustering coefficient, TPR and bridge ratio.</li>
+<li>The central part of the clustering coefficient distribution is biased towards the left, in a similar way as observed for the Youtube and Livejournal graphs.</li>
+<li>Communities of DATAGEN graphs are, as in real graphs, not isolated, although their level of isolation is significantly larger.</li>
+<li>The diameter is small, like in the real graphs.</li>
+<li>It is significant that communities in DATAGEN graphs are closer to those observed in Youtube and Livejournal, as these are social networks like the graphs produced by DATAGEN. 
We see that DATAGEN is able to reproduce many of their characteristics.</li>
+</ul>
+<p>Finally, the authors repeat the same experiment for LFR graphs. The following are the plots for the LFR graph with mixing ratio 0.3. From them, the authors extract the following conclusions:</p>
+<ul>
+<li>LFR graphs do not show the multimodal distribution observed in real graphs.</li>
+<li>Only the diameter shows a similar shape as in the ground truth.</li>
+</ul>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index13.png" alt=""></td>
+<td style="text-align:center"><img src="index14.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index15.png" alt=""></td>
+<td style="text-align:center"><img src="index16.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index17.png" alt=""></td>
+<td style="text-align:center"><img src="index18.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>To better quantify how similar the distributions of the different graphs are, the authors also show the correlograms for each of the statistical indicators. These correlograms contain Spearman&rsquo;s correlation coefficient between each pair of graphs for a given statistical indicator. The bluer the color, the better the correlation. We see that the DATAGEN distributions correlate very well with those observed in real graphs, especially, as we commented above, with Youtube and Livejournal. On the other hand, LFR only succeeds significantly in the case of the diameter.</p>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index19.png" alt=""></td>
+<td style="text-align:center"><img src="index20.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index21.png" alt=""></td>
+<td style="text-align:center"><img src="index22.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index23.png" alt=""></td>
+<td style="text-align:center"><img src="index24.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>We see that DATAGEN is able to reproduce a realistic community structure, compared to existing graph generators. This feature could potentially be exploited to define new benchmarks to measure the quality of novel community detection algorithms. Stay tuned for future blog posts about this topic!</p>
+<h4 id="references">References</h4>
+<p>[1] Arnau Prat-Pérez, <a href="http://dblp.uni-trier.de/pers/hd/d/Dom=iacute=nguez=Sal:David">David Domínguez-Sal</a>: How community-like is the structure of synthetically generated graphs? 
<a href="http://dblp.uni-trier.de/db/conf/sigmod/grades2014.html#PratD14">GRADES 2014</a></p> +<p>[2] Deepayan Chakrabarti, Yiping Zhan, and ChristosFaloutsos. R-mat: A recursive model for graph mining. SIAM 2014</p> +<p>[3] Myunghwan Kim and Jure Leskovec. Multiplicative attribute graph model of real-world networks. Internet Mathematics</p> +<p>[4] Andrea Lancichinetti, Santo Fortunato, and Filippo Radicchi. Benchmark graphs for testing community detection algorithms. Physical Review E 2008.</p> + + + + + Industry Relevance of the Semantic Publishing Benchmark + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + Tue, 03 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + <h3 id="publishing-and-media-businesses-are-going-through-transformation">Publishing and media businesses are going through transformation</h3> +<p>I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and wrestling my jetlag in front of Hilton. In the lobby inside the SemTech 2010 conference attendants were watching a game from the FIFA World Cup in South Africa. In the picture, the self-service newspaper stand is empty, except for one free paper. It was not long ago, in the year 2000, this stand was full. Back than the people in the Bay area were willing to pay for printed newspapers. But this is no longer true.</p> +<p>What’s driving this change in publishing and media?</p> +<ul> +<li> +<p>Widespread and instantaneous distribution of information over the Internet has turned news into somewhat of a &ldquo;commodity&rdquo; and few people are willing to pay for it</p> +</li> +<li> +<p>The wealth of free content on YouTube and similar services spoiled the comfort of many mainstream broadcasters;</p> +</li> +<li> +<p>Open access publishing has limited academic publishers to sell journals and books at prices that were considered fair ten years ago.</p> +</li> +</ul> +<p><em>Alongside other changes in the industry, publishers figured out that it is critical to add value through better authoring, promotion, discoverability, delivery and presentation of precious content.</em></p> +<h3 id="imagine-instant-news-in-context-imagine-personal-channels-imagine--triplestores">Imagine instant news in context, Imagine personal channels, Imagine &hellip; triplestores</h3> +<p>While plain news can be created repeatedly, premium content and services are not as easy to create. Think of an article that not only tells the new facts, but refers back to previous events and is complemented by an info-box of relevant facts. It allows one to interpret and comprehend news more effectively. This is the well-known journalistic aim to put news in context. It is also well-known that producing such news in &ldquo;near real time&rdquo; is difficult and expensive using legacy processes and content management technology.</p> +<p>Another example would be a news feed that delivers good coverage of information relevant to a narrow subject – for example a company, a story line or a region. Judging by the demand for intelligent press clipping services like <a href="http://new.dowjones.com/products/factiva/">Factiva</a>, such channels are in demand but are not straightforward to produce with today’s technology. 
Despite the common perception that automated recommendations for related content and personalized news are technology no-brainers, suggesting truly relevant content is far from trivial.</p> +<p>Finally, if we use an example in life sciences, the ability to quickly find scientific articles discussing asthma and x-rays, while searching for respiration disorders and radiation, requires a search service that is not easy to deliver.</p> +<p>Many publishers have been pressed to advance their business. This, in turn, had led to quest to innovate. And semantic technology can help publishers in two fundamental ways:</p> +<ol> +<li>Generation of rich and &ldquo;meaningful&rdquo; (trying not to use &ldquo;semantic&rdquo; :-) metadata descriptions; 1. Dynamic retrieval of content, based on this rich metadata, enabling better delivery.</li> +</ol> +<p>In this post I write about &ldquo;semantic annotation&rdquo; and how it enables application scenarios like BBC’s Dynamic Semantic Publishing (DSP). I will also present the business case behind DSP. The final part of the post is about triplestores – semantic graph database engines, used in DSP. To be more concrete I write about the Semantic Publishing Benchmark (SPB), which evaluates the performance of triplestores in DSP scenarios.</p> +<h3 id="semantic-annotation-produces-rich-metadata-descriptions--the-fuel-for-semantic-publishing">Semantic Annotation produces Rich Metadata Descriptions – the fuel for semantic publishing</h3> +<p>The most popular meaning of &ldquo;semantic annotation&rdquo; is the process of enrichment of text with links to (descriptions of) concepts and entities mentioned in the text. This usually means tagging either the entire document or specific parts of it with identifiers of entities. These identifiers allow one to retrieve descriptions of the entities and relations to other entities – additional structured information that fuels better search and presentation.</p> +<p><img src="02_semantic_repository.png" alt=""></p> +<p>The concept of using <a href="http://infosys3.elfak.ni.ac.rs/nastava/attach/SemantickiWebKurs/sdarticle.pdf">text-mining for automatic semantic annotation</a> of text with respect to very large datasets, such as <a href="http://dbpedia.org/">DBPedia</a>, emerged in early 2000. In practical terms it means using such large datasets as a sort of gigantic gazetteer (name lookup tool) and the ability to disambiguate. Figuring out whether &ldquo;Paris&rdquo; in the text refers to the capital of France or to Paris, Texas, or to Paris Hilton is crucial in such context. Sometimes this is massively difficult – try to instruct a computer how to guess whether &ldquo;Hilton&rdquo; in the second sentence of this post refers to a hotel from the chain founded by her grandfather or that I had the chance to meet Paris Hilton in person on the street in San Francisco.</p> +<p>Today there are plenty of tools (such as the <a href="https://www.ontotext.com/semantic-solutions/media-publishing/">Ontotext Media and Publishing</a> platform and <a href="https://github.com/dbpedia-spotlight/dbpedia-spotlight/wiki">DBPedia Spotlight</a>) and services (such as Thomson Reuter’s <a href="http://www.opencalais.com/">OpenCalais</a> and Ontotext’s <a href="http://s4.ontotext.com">S4</a>) that offer automatic semantic annotation. Although text-mining cannot deliver 100% correct annotations, there are plenty of scenarios, where technology like this would revoluntionize a business. 
This is the case with the Dynamic Semantic Publishing scenario described below.</p> +<h3 id="the-bbcs-dynamic-semantic-publishing-dsp">The BBC’s Dynamic Semantic Publishing (DSP)</h3> +<p>Dynamic Semantic Publishing is a model for using semantic technology in media developed by a group led by John O’Donovan and Jem Rayfield at the BBC. The implementation of DSP behind BBC’s FIFA World Cup 2010 website was the first high-profile success story for usage of semantic technology in media. It is also the basis for the SPB benchmark – sufficient reasons to introduce this use case at length below.</p> +<p>BBC Future Media &amp; Technology department have transformed the BBC relational content management model and static publishing framework to a fully dynamic semantic publishing architecture. With minimal journalistic management, media assets are being enriched with links to concepts, semantically described in a triplestore. This novel semantic approach provides improved navigation, content re-use and re-purposing through automatic aggregation and rendering of links to relevant stories. At the end of the day DSP improves the user experience on BBC’s web site.</p> +<p><em>&ldquo;A high-performance dynamic semantic publishing framework facilitates the publication of automated metadata-driven web pages that are light-touch, requiring minimal journalistic management, as they automatically aggregate and render links to relevant stories&rdquo;.</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">Jem Rayfield, Senior Technical Architect</a>, BBC News and Knowledge</p> +<p>The Dynamic Semantic Publishing (DSP) architecture of the BBC curates and publishes content (e.g. articles or images) based on embedded Linked Data identifiers, ontologies and associated inference. It allows for journalists to determine levels of automation (&ldquo;edited by exception&rdquo;) and support semantic advertisement placement for audiences outside of the UK. The following quote explains the workflow when a new article gets into BBC’s content management system.</p> +<p><em>&ldquo;In addition to the manual selective tagging process, journalist-authored content is automatically analysed against the World Cup ontology. A <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#language">natural language and ontological determiner process</a> automatically extracts World Cup concepts embedded within a textual representation of a story. The concepts are moderated and, again, selectively applied before publication. Moderated, automated concept analysis improves the depth, breadth and quality of metadata publishing.</em></p> +<p><img src="03_bbc_sport.png" alt=""></p> +<p><em>Journalist-published metadata is captured and made persistent for querying using the resource description framework (<a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#RDF"><em>RDF</em></a>) metadata representation and triple store technology. <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#BigOWLIM">A RDF triplestore</a> and <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#SPARQL">SPARQL</a> approach was chosen over and above traditional relational database technologies due to the requirements for interpretation of metadata with respect to an ontological domain model. 
The high level goal is that the domain ontology allows for intelligent mapping of journalist assets to concepts and queries. The chosen triplestore provides reasoning following the forward-chaining model and thus implied inferred statements are automatically derived from the explicitly applied journalist metadata concepts. For example, if a journalist selects and applies the single concept &ldquo;Frank Lampard&rdquo;, then the framework infers and applies concepts such as &ldquo;England Squad&rdquo;, &ldquo;Group C&rdquo; and &ldquo;FIFA World Cup 2010&rdquo; &hellip;&rdquo;</em> &ndash; Jem Rayfield</p> +<p>One can consider each of the &ldquo;aggregation pages&rdquo; of BBC as a sort of feed or channel serving content related to a specific topic. If you take this perspective, with its World Cup 2010 website BBC was able to provide more than 700 thematic channels.</p> +<p><em>&ldquo;The World Cup site is a large site with over 700 aggregation pages (called index pages) designed to lead you on to the thousands of story pages and content</em></p> +<p><strong>…</strong><strong><em>we are not publishing pages, but publishing content</em></strong> <em>as assets which are then organized by the metadata dynamically into pages, but could be re-organized into any format we want much more easily than we could before.</em></p> +<p><img src="04_content_tagging.png" alt=""></p> +<p><em>… The index pages are published automatically. This process is what assures us of the highest quality output, but still <strong>save large amounts of time</strong> in managing the site and <strong>makes it possible for us to efficiently run so many pages</strong> for the World Cup.&rdquo;</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/the_world_cup_and_a_call_to_ac.html">John O&rsquo;Donovan, Chief Technical Architect, BBC Future Media &amp; Technology</a></p> +<p>To get a real feeling about the load of the triplestore behind BBC&rsquo;s World Cup web site, here are some statistics:</p> +<ul> +<li> +<p>800+ aggregation pages (Player, Team, Group, etc.), generated through SPARQL queries;</p> +</li> +<li> +<p>Average unique page requests/day: 2 million;</p> +</li> +<li> +<p>Average <strong>SPARQL queries/day: 1 million;</strong></p> +</li> +<li> +<p><strong>100s repository updates/inserts per minute</strong> with OWL 2 RL reasoning;</p> +</li> +<li> +<p>Multi data center that is fully resilient, clustered 6 node triplestore.</p> +</li> +</ul> +<h3 id="the-semantic-publishing-benchmark">The Semantic Publishing Benchmark</h3> +<p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the BBC Dynamic Semantic Publishing scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volumes of read requests (SPARQL queries collecting recent content and data to generate web pages on a specific subject, e.g. Frank Lampard).</p> +<p>SPB simulates a setup for media that deals with large volumes of streaming content, e.g. articles, pictures, videos. This content is being enriched with metadata that describes it through links to reference knowledge:</p> +<ul> +<li> +<p><em>Reference knowledge:</em> taxonomies and databases that include relevant concepts, entities and factual information (e.g. 
sport statistics);</p> +</li> +<li> +<p><em>Metadata</em> for each individual piece of content allows publishers to efficiently produce live streams of content relevant to specific subjects.</p> +</li> +</ul> +<p>In this scenario the triplestore holds both reference knowledge and metadata. The main interactions with the repository are of two types:</p> +<ul> +<li> +<p><em>Aggregation queries</em> retrieve content according to various criteria. There are two sets (mixes) of aggregation queries. The basic one includes interactive queries that involve retrieval of concrete pieces of content, as well as aggregation functions, geo-spatial and full-text search constraints. The analytical query mix includes analytical queries, faceted search and drill-down queries;</p> +</li> +<li> +<p><em>Updates</em>, adding new metadata or updating the reference knowledge. It is important that such updates should immediately impact the results of the aggregation queries. Imagine a fan checking the page for Frank Lampard right after he scored a goal – she will be very disappointed to see out of date statistics there.</p> +</li> +</ul> +<p>SPB v.1.0 directly reproduces the DSP setup at the BBC. The reference dataset consists of BBC Ontologies (Core, Sport, News), BBC datasets (list of F1 teams, MPs, etc.) and an excerpt from <a href="http://www.geonames.org/">Geonames</a> for the UK. The benchmark is packed with metadata generator that allows one to set up experiments at different scales. The metadata generator produces 19 statements per Creative Work (BBC’s slang for all sorts of media assets). The standard scale factor is 50 million statements.</p> +<p>A more technical introduction to SPB can be found in this <a href="https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark">post</a>. Results from experiments with SPB on different hardware configurations, including AWS instances, are available in this <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">post</a>. An interesting discovery is that given the current state of the technology (particularly the GraphDB v.6.1 engine) and today’s cloud infrastructure, the load of BBC’s World Cup 2010 website can be handled at AWS by a cluster that costs only $81/day.</p> +<p>Despite the fact that SPB v.1.0 follows closely the usage scenario for triplestores in BBC’s DSP incarnations, it is relevant to a wide range of media and publishing scenarios, where large volumes of &ldquo;fast flowing&rdquo; content need to be &ldquo;dispatched&rdquo; to serve various information needs of a huge number of consumers. The main challenges can be summarized as follows:</p> +<ul> +<li> +<p>The Triplestore is used as operational database serving a massive number of read queries (hundreds of queries per second) in parallel with tens of update transactions per second. Transactions need to be handled instantly and in a reliable and consistent manner;</p> +</li> +<li> +<p>Reasoning is needed to map content descriptions to queries in a flexible manner;</p> +</li> +<li> +<p>There are specific requirements, such as efficient handling of full-text search, geo-spatial and temporal constraints.</p> +</li> +</ul> +<h3 id="spb-v20--steeper-for-the-engines-closer-to-the-publishers">SPB v.2.0 – steeper for the engines, closer to the publishers</h3> +<p>We are in the final testing of the new version 2.0 of SPB. 
The benchmark has evolved to allow for retrieval of semantically relevant content in a more advanced manner and at the same time to demonstrate how triplestores can offer simplified and more efficient querying.</p> +<p>The major changes in SPB v.2.0 can be summarized as follows:</p> +<ul> +<li> +<p>Much bigger reference dataset: from 170 thousand to 22 million statements. Now it includes GeoNames data about all of Europe (around 7 million statements) and DBPedia data about companies, people and events (14 million statements). This way we can simulate media archives described against datasets with good global coverage for specific types of objects. Such large reference sets also provide a better testing ground for experiments with very large content archives – think of 50 million documents (1 billion statements) or more;</p> +</li> +<li> +<p>Better interconnected reference data: more than 5 million links between entities, including 500,000 owl:sameAs links between DBPedia and Geonames descriptions. The latter evaluates the capabilities of the engine to deal with data coming from multiple sources, which use different identifiers for one and the same entity;</p> +</li> +<li> +<p>Retrieval of relevant content through links in the reference data, including inferred ones. To this end it is important than SPB v.2.0 involves much more comprehensive inference, particularly with respect to transitive closure of parent-company and geographic nesting chains.</p> +</li> +</ul> + + + + + OWL-Empowered SPARQL Query Optimization + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + Wed, 18 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + <p>The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution plans for a given query.</p> +<p>In this post, we propose a different approach to query optimization, which is meant to complement (rather than replace) the standard optimization methodologies for SPARQL queries. Our approach is based on the use of schema information, encoded using OWL constructs, which often accompany Linked Data.</p> +<p>OWL adopts the Open World Assumption and hence OWL axioms are perceived primarily to infer new knowledge. Nevertheless, ontology designers consider OWL as an expressive schema language used to express constraints for validating the datasets, hence following the Closed World Assumption when interpreting OWL ontologies. Such constraints include disjointness/equivalence of classes/properties, cardinality constraints, domain and range restrictions for properties and others.</p> +<p>This richness of information carried over by OWL axioms can be the basis for the development of schema-aware techniques that will allow significant improvements in the performance of existing RDF query engines when used in tandem with data statistics or even other heuristics based on patterns found in SPARQL queries. 
As a simple example, a cardinality constraint at the schema level can provide a hint on the proper join ordering, even if data statistics are missing or incomplete.</p> +<p>The aim of this post is to show that the richness of information carried over by OWL axioms under the Close World Assumption can be the basis for the development of schema-aware optimization techniques that will allow considerable improvement for query processing. To attain this objective, we discuss a small set of interesting cases of OWL axioms; a full list can be found <a href="LDBC_D4.4.2_final.pdf">here</a>.</p> +<h3 id="schema-based-optimization-techniques">Schema-Based Optimization Techniques</h3> +<p>Here we provide some examples of queries, which, when combined with specific schema constraints expressed in OWL, can help the optimizer in formulating the (near to) optimal query plans.</p> +<p>A simple first case is the case of constraint violation. Consider the query below, which returns all instances of class <code>&lt;A&gt;</code> which are fillers of a specific property <code>&lt;P&gt;</code>. If the underlying schema contains the information that the range of <code>&lt;P&gt;</code> is class <code>&lt;B&gt;</code>, and that class <code>&lt;B&gt;</code> is disjoint from class <code>&lt;A&gt;</code>, then this query should return the empty result, with no further evaluation (assuming that the constraints associated with the schema are satisfied by the data). An optimizer that takes into account schema information should return an empty result in constant time instead of trying to optimize or evaluate the large star join.</p> +<pre tabindex="0"><code>SELECT ?v +WHERE { ?v rdf : type &lt;A&gt; . + ?u &lt;P&gt; ?v . ?u &lt;P&gt; ?v1 . + ?u &lt;P1 &gt; ?v2 . ?u &lt;P2 &gt; ?v3 . + ?u &lt;P3 &gt; ?v4 . ?u &lt;P4 &gt; ?v5} +</code></pre><p>Schema-aware optimizers could also prune the search space by eliminating results that are known a priori not to be in the answer set of a query. The query above is an extreme such example (where all potential results are pruned), but other cases are possible, such as the case of the query below, where all subclasses of class <code>&lt;A1&gt;</code> can immediately be identified as not being in the answer set.</p> +<pre tabindex="0"><code>SELECT ?c +WHERE { ?x rdf: type ?c . ?x &lt;P&gt; ?y . + FILTER NOT EXISTS \{ ?x rdf: type &lt;A1 &gt; }} +</code></pre><p>Another category of schema-empowered optimizations has to do with improved selectivity estimation. In this respect, knowledge about the cardinality (minimum cardinality, maximum cardinality, exact cardinality, functionality) of a property can be exploited to formulate better query plans, even if data statistics are incomplete, missing or erroneous.</p> +<p>Similarly, taking into account class hierarchies, or the definition of classes/properties via set theoretic constructs (union, intersection) at the schema level, can provide valuable information on the selectivity of certain triple patterns, thus facilitating the process of query optimization. Similar effects can be achieved using information about properties (functionality, transitivity, symmetry etc).</p> +<p>As an example of these patterns, consider the query below, where class <code>&lt;C&gt;</code> is defined as the intersection of classes <code>&lt;C1&gt;</code>,<code> &lt;C2&gt;</code>. 
Thus, the triple pattern <code>(?x rdf:type &lt;C&gt;)</code> is more selective than <code>(?y rdf:type &lt;C1&gt;)</code> and <code>(?z rdf:type &lt;C2&gt;)</code> and this should be immediately recognizable by the optimizer, without having to resort to cost estimations. This example shows also how unnecessary triple patterns can be pruned from a query to reduce the number of necessary joins. Figure 1 illustrates the query plan obtained when the OWL intersectionOf construct is used.</p> +<pre tabindex="0"><code>SELECT ?x +WHERE { ?x rdf: type &lt;C&gt; . ?x &lt;P1 &gt; ?y . + ?y rdf : type &lt;C1 &gt; . ?y &lt;P2 &gt; ?z . ?z rdf : type &lt;C2 &gt; } +</code></pre><p><img src="owl_constraints.png" alt="image"></p> +<p>Schema information can also be used by the query optimizer to rewrite SPARQL queries to equivalent ones that are found in a form for which already known optimization techniques are easily applicable. For example, the query below could easily be transformed into a classical star-join query if we know (from the schema) that property <code>P4</code> is a symmetric property.</p> +<pre tabindex="0"><code>SELECT ?y ?y1 ?y2 ?y3 +WHERE { ?x &lt;P1 &gt; ?y . ?x &lt;P2 &gt; ?y1 . + ?x &lt;P3 &gt; ?y2 . ?y3 &lt;P4 &gt; ?x } +</code></pre><h3 id="conclusion">Conclusion</h3> +<p>In this post we argued that OWL-empowered optimization techniques can be beneficial for SPARQL query optimization when used in tandem with standard heuristics based on statistics. We provided some examples which showed the power of such optimizations in various cases, namely:</p> +<ul> +<li>Cases where the search space can be pruned due to the schema and the associated constraints; an extreme special sub-case is the identification of queries that violate schema constraints and thus produce no results.</li> +<li>Cases where the schema can help in the estimation of triple pattern selectivity, even if statistics are incomplete or missing.</li> +<li>Cases where the schema can identify redundant triple patterns that do not affect the result and can be safely eliminated from the query.</li> +<li>Cases where the schema can be used for rewriting a query in an equivalent form that would facilitate optimization using well-known optimization techniques.</li> +</ul> +<p>This list is by no means complete, as further cases can be identified by optimizers. Our aim in this post was not to provide a complete listing, but to demonstrate the potential of the idea in various directions.</p> + + + + + Person Activity Subgraph Features in LDBC DATAGEN + https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/ + Wed, 04 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/ + <p>When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically borrowed by the friendship subgraph and/or its structure. However, a social graph is more than a bunch of people being connected by friendship relations, but has a lot more of other things is worth to look at. With a quick view to commercial social networks like Facebook, Twitter or Google+, one can easily identify a lot of other elements such as text images or even video assets. More importantly, all these elements form other subgraphs within the social network! 
For example, the person activity subgraph is composed of posts and their replies in the different forums/groups of a social network, and has a tree-like structure connecting people through their message interactions.</p>
+<p>When looking at the LDBC Social Network Benchmark (SNB) and its interactive workload, one realizes that these other subgraphs, and especially the person activity subgraph, play a role even more important than that played by the friendship subgraph. Just two numbers illustrate this importance: 11 out of the 14 interactive workload queries need to traverse parts of the person activity subgraph, and about 80% of all the data generated by DATAGEN belongs to this subgraph. As a consequence, a lot of effort has been devoted to making sure that the person activity subgraph is realistic enough to fulfill the needs of the benchmark. In the rest of this post, I will discuss some of the features implemented in DATAGEN that make the person activity subgraph interesting.</p>
+<h3 id="reaslistic-message-content">Realistic Message Content</h3>
+<p>Messages&rsquo; content in DATAGEN is not random, but contains snippets of text extracted from DBpedia related to the tags the message has. Furthermore, not all messages are the same size; this depends on whether they are posts or replies. For example, the size of a post is selected uniformly between a minimum and a maximum, but there is also a small probability that the content is very large (about 2000 characters). In the case of comments (replies to posts), there is a probability of 0.66 that they are very short (“ok”, “good”, “cool”, “thanks”, etc.). Moreover, in real forum conversations, it is typical to see conversations evolving from one topic to another. For this reason, there is a probability that the tags of comments replying to a post change during the flow of the conversation, moving from the post&rsquo;s tags to other related or randomly selected tags.</p>
+<h3 id="non-uniform-activity-levels">Non uniform activity levels</h3>
+<p>In a real social network, not all members show the same level of activity. Some people post messages only sporadically, while the activity of others is significantly higher. DATAGEN reproduces this phenomenon by correlating the activity level with the number of friends a person has. That is, the more friends a person has, the larger the number of posts they create, and also the larger the number of groups they belong to.</p>
+<h3 id="time-correlated-post-and-comment-generation">Time correlated post and comment generation</h3>
+<p>In a real social network, user activity is driven by real world events such as sports events, elections or natural disasters, to cite just a few. For this reason, we observe spikes of activity around these events, where the number of messages created increases significantly during a short period of time, reaching a maximum and then decreasing. DATAGEN emulates this behavior by generating a set of real world events about specific tags. Then, when the dates of posts and comments are generated, these events are taken into account in such a way that posts and comments are clustered around them. Also, not all events are equally relevant, so some spikes are larger than others. The shape of the activity spike follows the model described in <a href="#references">[1]</a>. Furthermore, in order to represent the more normal and uniform person activity levels, we also generate uniformly distributed messages along the timeline. 
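</p>
+<p>To make the interplay concrete, the following is a purely illustrative sketch (hypothetical names and constants, not actual Datagen parameters; dates are epoch seconds) of how a person&rsquo;s post count can grow with their number of friends, with each post date either drawn uniformly or clustered around an event:</p>
+<pre tabindex="0"><code>import random
+
+# illustrative constants only, not actual Datagen parameters
+BASE_POSTS, AVG_FRIENDS, UNIFORM_RATIO = 20, 30, 0.5
+
+def post_dates(num_friends, membership_date, end_of_simulation, event_dates):
+    # more friends means more posts for this person
+    num_posts = max(1, round(BASE_POSTS * num_friends / AVG_FRIENDS))
+    dates = []
+    for _ in range(num_posts):
+        if random.random() &lt; UNIFORM_RATIO:
+            # uniformly distributed activity along the timeline
+            dates.append(random.uniform(membership_date, end_of_simulation))
+        else:
+            # activity clustered around a real-world event spike; the Gaussian
+            # offset is only a stand-in for the density of [1]
+            peak = random.choice(event_dates)
+            dates.append(peak + random.gauss(0, 4 * 3600))
+    return sorted(dates)
+</code></pre>
+<p>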
The following figure shows the user activity volume along the time line.</p> +<p><img src="1.png" alt="image"></p> +<p>As we see, the timeline contains spikes of activity, instead of being uniform. Note that the generally increasing volume activity is due to the fact that more people is added to the social network as time advances.</p> +<p>In this post we have reviewed several interesting characteristics of the person activity generation process in DATAGEN. Stay tuned for future blog posts about this topic.</p> +<h4 id="references">References</h4> +<p>[1] Leskovec, J., Backstrom, L., &amp; Kleinberg, J. (2009, June). Meme-tracking and the dynamics of the news cycle. In <em>Proceedings of the 15th ACM SIGKDD international conference on Knowledge discovery and data mining</em> (pp. 497-506). ACM.</p> + + + + + SNB Driver - Part 2: Tracking Dependencies Between Queries + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + Fri, 23 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + <p>The <a href="https://ldbcouncil.org/post/snb-driver-part-1">SNB Driver part 1</a> post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we&rsquo;ll drill down deeper into the details of what it means to execute &ldquo;dependent queries&rdquo; during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in detail, it is just there to serve as a point of reference.</p> +<h3 id="definitions">Definitions</h3> +<ul> +<li> +<p><em>Simulation Time (ST)</em>: notion of time created by data generator. All time stamps in the generated data set are in simulation time</p> +</li> +<li> +<p><em>Real Time (RT)</em>: wall clock time</p> +</li> +<li> +<p><em>Time Compression Ratio</em>: function that maps simulation time to real time, e.g., an offset in combination with a compression ratio. It is a static value, set in driver configuration. Real Time Ratio is reported along with benchmark results, allowing others to recreate the same benchmark</p> +</li> +<li> +<p><em>Operation</em>: read and/or write</p> +</li> +<li> +<p><em>Dependencies</em>: operations in this set introduce dependencies in the workload. That is, for every operation in this set there exists at least one other operation (in Dependents) that can not be executed until this operation has been processed</p> +</li> +<li> +<p><em>Dependents</em>: operations in this set are dependent on at least one other operation (in Dependencies) in the workload</p> +</li> +<li> +<p><em>Due Time (DueT)</em>: point in simulation time at which the execution of an operation should be initiated.</p> +</li> +<li> +<p><em>Dependent Time (DepT)</em>: in addition to Due Time, every operation in Dependents also has a Dependent Time, which corresponds to the Due Time of the operation that it depends on. Dependent Time is always before Due Time. 
For operations with multiple dependencies, Dependent Time is the maximum Due Time of all the operations it depends on.</p>
+</li>
+<li>
+<p><em>Safe Time (SafeT)</em>: time duration.</p>
+<ul>
+<li>
+<p>when two operations have a necessary order in time (i.e., a dependency) there is at least a SafeT interval between them</p>
+</li>
+<li>
+<p>SafeT is the minimum duration between the Dependent Time and Due Time of any operation in Dependents</p>
+</li>
+</ul>
+</li>
+<li>
+<p><em>Operation Stream</em>: sequence of operations ordered by Due Time (dependent operations must be separated by at least SafeT)</p>
+</li>
+<li>
+<p><em>Initiated Operations</em>: operations that have started executing but not yet finished</p>
+</li>
+<li>
+<p><em>Local Completion Time (per driver)</em>: point in simulation time behind which there are no uncompleted operations. Local Completion Time = min(min(Initiated Operations), max(Completed Operations))</p>
+</li>
+<li>
+<p><em>Global Completion Time (GCT)</em>: minimum completion time of all drivers. Once GCT has advanced to the Dependent Time of some operation, that operation is safe to execute, i.e., the operations it depends on have all completed executing. Global Completion Time = min(Local Completion Time)</p>
+</li>
+<li>
+<p><em>Execution Window (Window)</em>: a timespan within which all operations can be safely executed</p>
+<ul>
+<li>
+<p>All operations satisfying window.startTime &lt;= operation.DueT &lt; window.endTime may be executed</p>
+</li>
+<li>
+<p>Within a window no restrictions on operation ordering or operation execution time are enforced; the driver is free to choose an arbitrary scheduling strategy inside the window</p>
+</li>
+<li>
+<p>To ensure that execution order respects dependencies between operations, window size is bounded by SafeT, such that: 0 &lt; window.duration &lt;= SafeT</p>
+</li>
+<li>
+<p>Window duration is fixed, per operation stream; this is to simplify scheduling and make benchmark runs repeatable</p>
+</li>
+<li>
+<p>Before any operations within a window can start executing it is required that: GCT &gt;= window.startTime - (SafeT - window.duration)</p>
+</li>
+<li>
+<p>All operations within a window must initiate and complete between window start and end times: window.startTime &lt;= operation.initiate &lt; window.endTime and window.startTime &lt;= operation.complete &lt; window.endTime</p>
+</li>
+</ul>
+</li>
+<li>
+<p><em>Dependency Mode</em>: defines dependencies, i.e., constraints on operation execution order</p>
+</li>
+<li>
+<p><em>Execution Mode</em>: defines how the runtime should execute operations of a given type</p>
+</li>
+</ul>
+<h3 id="tracking-dependencies">Tracking Dependencies</h3>
+<p>Now, the fun part: making sure dependent operations are executed in the correct order.</p>
+<p>Consider that every operation in a workload belongs to none, one, or both of the following sets: Dependencies and Dependents. As mentioned, the driver uses operation time stamps (Due Times) to ensure that dependencies are maintained. It keeps track of the latest point in time behind which every operation has completed. That is, every operation (i.e., dependency) with a Due Time lower than or equal to this time is guaranteed to have completed execution. 
It does this by maintaining a monotonically increasing variable called Global Completion Time (GCT).</p> +<p>Logically, every time the driver (via a database connector) begins execution of an operation from Dependencies that operation is added to Initiated Operations:</p> +<ul> +<li>the set of operations that have started executing but not yet finished.</li> +</ul> +<p>Then, upon completion, the operation is removed from Initiated Operations and added to Completed Operations:</p> +<ul> +<li>the set of operations that have started and finished executing.</li> +</ul> +<p>Using these sets, each driver process maintains its own view of GCT in the following way. Local progress is monitored and managed using a variable called Local Completion Time (LCT):</p> +<ul> +<li>the point in time behind which there are no uncompleted operations. No operation in Initiated Operations has a lower or equal Due Time and no operation in Completed Operations has an equal or higher Due Time.</li> +</ul> +<p>LCT is periodically sent to all other driver processes, which all then (locally) set their view of GCT to the minimum LCT of all driver processes. At this point the driver has two, of the necessary three (third covered shortly), pieces of information required for knowing when to execute an operation:</p> +<ul> +<li> +<p><em>Due Time</em>: point in time at which an operation should be executed, assuming all preconditions (e.g., dependencies) have been fulfilled</p> +</li> +<li> +<p><em>GCT</em>: every operation (from Dependencies) with a Due Time before this point in time has completed execution</p> +</li> +</ul> +<p>However, with only GCT to track dependencies the driver has no way of knowing when it is safe to execute any particular dependent operation. What GCT communicates is that all dependencies up to some point in time have completed, but whether or not the dependencies for any particular operation are within these completed operations is unknown. The driver would have to wait until GCT has passed the Due Time (because Dependency Time is always lower) of an operation before that operation could be safely executed, which would result in the undesirable outcome of every operation missing its Due Time. The required information is which particular operation in Dependencies does any operation in Dependents depend on. More specifically, the Due Time of this operation. This is referred to as Dependent Time:</p> +<ul> +<li>in addition to Due Time, every operation in Dependents also has (read: must have) a Dependent Time, which corresponds to the latest Due Time of all the operations it depends on. Once GCT has advanced beyond the Dependent Time of an operation that operation is safe to execute.</li> +</ul> +<p>Using these three mechanisms (Due Time, GCT, and Dependent Time) the driver is able to execute operations, while ensuring their dependencies are satisfied beforehand.</p> +<h3 id="scalable-execution-in-the-presence-of-dependencies">Scalable execution in the Presence of Dependencies</h3> +<p>The mechanisms introduced in part 1 guarantee that dependency constraints are not violated, but in doing so they unavoidably introduce overhead of communication/synchronization between driver threads/processes. To minimize the negative effects that synchronization has on scalability an additional Execution Mode was introduced (more about Execution Modes will be discussed shortly): Windowed Execution. 
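</p>
+<p>Before looking at Windowed Execution in detail, the completion-time bookkeeping described above can be summarised in a short sketch (illustrative Python with invented names, not the driver&rsquo;s actual code; it follows the formulas given in the definitions):</p>
+<pre tabindex="0"><code>import threading
+
+class CompletionTimeTracker:
+    # tracks, per driver process, the Due Times of Dependencies operations
+    def __init__(self):
+        self.lock = threading.Lock()
+        self.initiated = set()   # started but not yet finished
+        self.completed = set()   # finished
+
+    def on_initiate(self, due_time):
+        with self.lock:
+            self.initiated.add(due_time)
+
+    def on_complete(self, due_time):
+        with self.lock:
+            self.initiated.discard(due_time)
+            self.completed.add(due_time)
+
+    def local_completion_time(self):
+        # LCT = min(min(Initiated Operations), max(Completed Operations))
+        with self.lock:
+            candidates = []
+            if self.initiated:
+                candidates.append(min(self.initiated))
+            if self.completed:
+                candidates.append(max(self.completed))
+            return min(candidates) if candidates else None
+
+def global_completion_time(local_cts):
+    # GCT = min(Local Completion Time) over all driver processes
+    return min(local_cts)
+
+def may_execute(operation_dependent_time, gct):
+    # a dependent operation is safe once GCT has passed its Dependent Time
+    return gct &gt;= operation_dependent_time
+</code></pre>
+<p>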
Windowed Execution has two design goals:</p> +<p>a) make the generated load less &lsquo;bursty&rsquo;</p> +<p>b) allow the driver to &lsquo;scale&rsquo;, so when the driver is given more resources (CPUs, servers, etc.) it is able to generate more load.</p> +<p>In the context of Windowed Execution, operations are executed in groups (Windows), where operations are grouped according to their Due Time. Every Window has a Start Time, a Duration, and an End Time, and Windows contain only those operations that have a Due Time between Window.startTime and Window.endTime. Logically, all operations within a Window are executed at the same time, some time within the Window. No guaranty is made regarding exactly when, or in what order, an operation will execute within its Window.</p> +<p>The reasons this approach is correct are as follows:</p> +<ul> +<li> +<p>Operations belonging to the Dependencies set are never executed in this manner - the Due Times of Dependencies operations are never modified as this would affect how dependencies are tracked</p> +</li> +<li> +<p>The minimum duration between the Dependency Time and Due Time of any operation in Dependents is known (can be calculated by scanning through workload once), this duration is referred to as Safe Time (SafeT)</p> +</li> +<li> +<p>A window does not start executing until the dependencies of all its operations have been fulfilled. This is ensured by enforcing that window execution does not start until</p> +<p>GCT &gt;= window.startTime - (SafeT - window.duration) = window.endTime - SafeT; that is, the duration between GCT and the end of the window is no longer than SafeT</p> +</li> +</ul> +<p>The advantages of such an execution mode are as follows:</p> +<ul> +<li> +<p>As no guarantees are made regarding time or order of operation execution within a Window, GCT no longer needs to be read before the execution of every operation, only before the execution of every window</p> +</li> +<li> +<p>Then, as GCT is read less frequently, it follows that it does not need to be communicated between driver processes as frequently. There is no need or benefit to communicating GCT protocol message more frequently than approximately Window.duration, the side effect of which is reduced network traffic</p> +</li> +<li> +<p>Further, by making no guarantees regarding the order of execution the driver is free to reschedule operations (within Window bounds). The advantage being that operations can be rearranged in such a way as to reduce unwanted bursts of load during execution, which could otherwise occur while synchronizing GCT during demanding workloads. For example, a uniform scheduler may modify operation Due Times to be uniformly distributed across the Window timespan, to &lsquo;smoothen&rsquo; the load within a Window.</p> +</li> +</ul> +<p>As with any system, there are trade-offs to this design, particularly regarding Window.duration. The main trade-off is that between &lsquo;workload resolution&rsquo; and scalability. Increasing Window.duration reduces synchronization but also reduces the resolution at which the workload definition is followed. That is, the generated workload becomes less like the workload definition. However, as this is both bounded and configurable, it is not a major concern. This issue is illustrated in Figure 1, where the same stream of events is split into two different workloads based on different size of the Window. 
The workload with Window size 5 (on the right) has better resolution, especially for the &lsquo;bursty&rsquo; part of the event stream.</p> +<p><img src="window-scheduling.png" alt="image"><br> +Figure 1. Window scheduling</p> +<p>This design also trades a small amount of repeatability for scalability: as there are no timing or ordering guarantees within a window, two executions of the same window are not guaranteed to be equivalent - &lsquo;what happens in the window stays in the window&rsquo;. Despite sacrificing this repeatability, the results of operations do not change. No dependency-altering operations occur during the execution of a Window, therefore results for all queries should be equivalent between two executions of the same workload, there is no effect on the expected result for any given operation.</p> + + + + + SNB Driver - Part 3: Workload Execution Putting It All Together + https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/ + Tue, 20 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/ + <p>Up until now we have introduced the <a href="https://ldbcouncil.org/post/snb-driver-part-1">challenges faced when executing the LDBC SNB benchmark</a>, as well as explained <a href="https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries">how some of these are overcome</a>. With the foundations laid, we can now explain precisely how operations are executed.</p> +<p>Based on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these classifications the driver runtime then knows how each operation should be executed. These modes, as well as what they mean to the driver runtime, are described below.</p> +<h3 id="dependency-modes">Dependency Modes</h3> +<p>While executing a workload the driver treats operations differently, depending on their Dependency Mode. In the previous section operations were categorized by whether or not they are in the sets Dependencies and/or Dependents.</p> +<p>Another way of communicating the same categorization is by assigning a Dependency Mode to operations - every operation type generated by a workload definition must be assigned to exactly one Dependency Mode. Dependency modes define dependencies, constraints on operation execution order. The driver supports a number of different Dependency Modes: None, Read Only, Write Only, Read Write. 
During workload execution, operations of each type are treated as follows:</p>
+<p><strong>• None</strong></p>
+<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations having completed executing)</p>
+<p>– Prior Execution: do nothing</p>
+<p>– After Execution: do nothing</p>
+<p><strong>• Read Only</strong></p>
+<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations having completed executing)</p>
+<p>Dependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p>
+<p>– Prior Execution: wait for GCT &gt;= operation.DepT</p>
+<p>– After Execution: do nothing</p>
+<p><strong>• Write Only</strong></p>
+<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p>
+<p>Dependent On (NO): operation execution does not depend on GCT to have advanced sufficiently (i.e., correct execution of these operations does not depend on any other operations to have completed execution)</p>
+<p>– Prior Execution: add operation to Initiated Operations</p>
+<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p>
+<p><strong>• Read Write</strong></p>
+<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p>
+<p>Dependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p>
+<p>– Prior Execution: add operation to Initiated Operations, wait for GCT &gt;= operation.DepT</p>
+<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p>
+<h3 id="execution-modes">Execution Modes</h3>
+<p>Execution Modes relate to how operations are scheduled, when they are executed, and what their failure conditions are. Each operation type in a workload definition must be assigned to exactly one Execution Mode. The driver supports a number of different Execution Modes: Asynchronous, Synchronous, Partially Synchronous. It splits a single workload operation stream into multiple streams, zero or more streams per Execution Mode. 
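+</p>
+<p>Before going through each Execution Mode in detail, the Dependency Mode bookkeeping listed above can be made concrete with a small sketch. As before, the names are assumptions and not the driver&rsquo;s real types: the hooks below would wrap the execution of an operation regardless of which Execution Mode&rsquo;s scheduler invokes it, and the ledger interface stands in for the completion-time tracker sketched earlier.</p>
+<pre tabindex="0"><code>// Illustrative sketch only; assumed names, not the real driver types.
+import java.util.function.LongSupplier;
+
+enum DependencyMode { NONE, READ_ONLY, WRITE_ONLY, READ_WRITE }
+
+interface CompletionTimeLedger {           // e.g. the tracker from the earlier sketch
+    void onInitiate(long dueTime);
+    void onComplete(long dueTime);
+}
+
+class DependencyModeHooks {
+    private final CompletionTimeLedger ledger;
+    private final LongSupplier gct;        // latest GCT view received from other driver processes
+
+    DependencyModeHooks(CompletionTimeLedger ledger, LongSupplier gct) {
+        this.ledger = ledger;
+        this.gct = gct;
+    }
+
+    // Prior Execution: run immediately before the operation is sent to the database.
+    void priorExecution(DependencyMode mode, long dueTime, long dependentTime) throws InterruptedException {
+        if (dependedOn(mode)) ledger.onInitiate(dueTime);
+        if (dependentOn(mode)) {
+            while (gct.getAsLong() &lt; dependentTime) Thread.sleep(1);   // wait for GCT &gt;= operation.DepT
+        }
+    }
+
+    // After Execution: run once the database reports the operation as finished.
+    void afterExecution(DependencyMode mode, long dueTime) {
+        if (dependedOn(mode)) ledger.onComplete(dueTime);
+    }
+
+    private boolean dependedOn(DependencyMode m)  { return m == DependencyMode.WRITE_ONLY || m == DependencyMode.READ_WRITE; }
+    private boolean dependentOn(DependencyMode m) { return m == DependencyMode.READ_ONLY  || m == DependencyMode.READ_WRITE; }
+}
+</code></pre>
+<p>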
During workload execution, operations from each of these streams are treated as follows.</p> +<p><strong>• Asynchronous</strong>: operations are executed individually, when their Due Time arrives.</p> +<p>Motivation: This is the default execution mode, it executes operations as true to the workload definition as possible.</p> +<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler – Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: unbounded</p> +<p>– Max Execution Time: unbounded</p> +<p>– Failure: operation execution starts later than: operation.DueT Tolerated Delay</p> +<p><strong>• Synchronous</strong>: operations are executed individually, sequentially, in blocking manner.</p> +<p>Motivation: Some dependencies are difficult to capture efficiently with SafeT and GCT alone. For example, social applications often support conversations via posts and likes, where likes depend on the existence of posts. Furthermore, posts and likes also depend on the existence of the users that make them. However, users are created at a lower frequency than posts and likes, and it can be assumed they do not immediately start creating content. As such, a reasonably long SafeT can be used between the creation of a user and the first time that user creates posts or likes. Conversely, posts are often replied to and/or liked soon after their creation, meaning a short SafeT would be necessary to maintain the ordering dependency. Consequently, maintaining the dependencies related to conversations would require a short SafeT, and hence a small window. This results in windows containing fewer operations, leading to less potential for parallelism within windows, less freedom in scheduling, more synchronization, and greater likelihood of bursty behavior - all negative things.</p> +<p>The alternative offered by Synchronous Execution is that, when practical, operations of certain types can be partitioned (e.g. posts and likes could be partitioned by the forum in which they appear), and partitions assigned to driver processes. Using the social application example from above, if all posts and likes were partitioned by forum the driver process that executes the operations from any partition could simply execute them sequentially. 
Then the only dependency to maintain would be on user operations, reducing synchronization dramatically, and parallelism could still be achieved as each partition would be executed independently, in parallel, by a different driver process.</p> +<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler</p> +<p>– Execute When time &gt;= operation.DueT and previousOperation.completed == true (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: 1</p> +<p>– Max Execution Time: nextOperation.DueT - operation.DueT</p> +<p>– Failure: operation execution starts later than: operation.DueT Tolerated Delay E.g., if previousOperation did not complete in time, forcing current operation to wait for longer than the tolerated-delay</p> +<p><strong>• Partially Synchronous</strong> (Windowed Execution, described in Section 3.4 in more details), groups of operations from the same time window are executed together</p> +<p>– Re-scheduling Before Execution: Yes, as long as the following still holds:</p> +<p>window.startTime &lt;= operation.DueT &lt; window.startTime + window.duration</p> +<p>Operations within a window may be scheduled in any way, as long as they remain in the window from which they originated: their Due Times, and therefore ordering, may be modified</p> +<p>– Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: number of operations within window</p> +<p>– Max Execution Time: (window.startTime + window.duration) - operation.DueT</p> +<p>– Failure: operation execution starts later than: window.startTime window.duration operation execution does not finish by: window.startTime + window.duration</p> +<h3 id="tying-it-back-to-ldbc-snb">Tying it back to LDBC SNB</h3> +<p>The driver was designed to execute the workload of LDBC SNB. As discussed, the main challenge of running queries in parallel on graph-shaped data stem from dependencies introduced by the graph structure. In other words, workload partitioning becomes as hard as graph partitioning.</p> +<p>The LDBC SNB data can in fact be seen as a union of two parts:</p> +<ol> +<li> +<p>Core Data: relatively small and dense friendship graph (not more than 10% of the data). Updates on this part are very hard to partition among driver threads, since the graph is essentially a single dense strongly connected component.</p> +</li> +<li> +<p>User Activity Data: posts, replies, likes; this is by far the biggest part of the data. Updates on this part are easily partitioned as long as the dependencies with the &ldquo;core&rdquo; part are satisfied (i.e., users don&rsquo;t post things before the profiles are created, etc.).</p> +</li> +</ol> +<p>In order to avoid friendship graph partitioning, the driver introduces the concept SafeT, the minimal simulation time that should pass between two dependent events.</p> +<p>This property is enforced by the data generator, i.e. the driver does not need to change or delay some operations in order to guarantee dependency safety. Respecting dependencies now means globally communicating the advances of the Global Completion Time, and making sure the operations do not start earlier than SafeT from their dependents.</p> +<p>On the other hand, the driver exploits the fact that some of the dependencies in fact do not hinder partitioning: although replies to the post can only be sent after the post is created, these kinds of dependencies are satisfied if we partition workload by forums. 
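+</p>
+<p>A rough sketch of this forum-based partitioning, again with assumed names rather than the driver&rsquo;s real API: each partition is backed by a single-threaded executor, so updates belonging to the same forum run sequentially while different forums proceed in parallel, with no GCT coordination needed between them.</p>
+<pre tabindex="0"><code>// Illustrative sketch only; assumed names, not the real driver API.
+import java.util.ArrayList;
+import java.util.List;
+import java.util.concurrent.ExecutorService;
+import java.util.concurrent.Executors;
+
+class ForumPartitionedExecutor {
+    private final List&lt;ExecutorService&gt; partitions = new ArrayList&lt;&gt;();
+
+    ForumPartitionedExecutor(int parallelism) {
+        for (int i = 0; i &lt; parallelism; i++) {
+            // One single-threaded executor per partition: operations within it run sequentially.
+            partitions.add(Executors.newSingleThreadExecutor());
+        }
+    }
+
+    // All posts, replies and likes of one forum hash to the same partition,
+    // so their relative order is preserved without global coordination.
+    void submitForumUpdate(long forumId, Runnable update) {
+        int p = (int) Math.floorMod(forumId, (long) partitions.size());
+        partitions.get(p).submit(update);
+    }
+}
+</code></pre>
+<p>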
This way, all (update) operations on posts and comments from one forum are assigned to one driver thread. Since there is typically a lot of forums, each driver thread gets multiple ones. Updates from one forum are then run in Synchronous Execution Mode, and parallelism is achieved by running many distinct forums in parallel. By doing so, we can add posts and replies to forums at very high frequency without the need to communicate the GCT across driver instances (i.e. we efficiently create the so-called flash-mob effects in the posting/replying workload).</p> + + + + + Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide + https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/ + Tue, 13 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/ + <p>Until now we have discussed several aspects of the <a href="https://ldbcouncil.org/benchmarks/spb">Semantic Publishing Benchmark (SPB)</a> such as the <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">difference in performance between virtual and real servers configuration</a>, how to choose an <a href="https://ldbcouncil.org/post/making-semantic-publishing-execution-rules">appropriate query mix</a> for a benchmark run and our experience with using SPB in the development process of GraphDB for <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">finding performance issues</a>.</p> +<p>In this post we provide a step-by-step guide on how to run SPB using the <a href="http://rdf4j.org/">Sesame</a> RDF data store on a fresh install of <a href="http://releases.ubuntu.com/14.04.1/">Ubuntu Server 14.04.1</a>. The scenario is easy to adapt to other RDF triple stores which support the Sesame Framework used for querying and analyzing RDF data.</p> +<h3 id="prerequisites">Prerequisites</h3> +<p>We start with a fresh server installation, but before proceeding with setup of the Sesame Data Store and SPB benchmark we need the following pieces of software up and running:</p> +<ul> +<li>Git</li> +<li>Apache Ant 1.8 or higher</li> +<li>OpenJDK 6 or Oracle JDK 6 or higher</li> +<li>Apache Tomcat 7 or higher</li> +</ul> +<p>If you already have these components installed on your machine you can directly proceed to the next section: <em>Installing Sesame</em></p> +<p>Following are sample commands which can be used to install the required software components:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo apt-get install git +</span></span><span style="display:flex;"><span>sudo apt-get install ant +</span></span><span style="display:flex;"><span>sudo apt-get install default-jdk +</span></span><span style="display:flex;"><span>sudo apt-get install tomcat7 +</span></span></code></pre></div><p>Optionally Apache Tomcat Server can be downloaded as a zipped file and extracted in a location of choice.</p> +<p>After a successful installation of Apache Tomcat you should be able to get the default splash page <em>“It works”</em> when you open your web browser and enter the following address: http://&lt;your_ip_address&gt;:8080</p> +<h3 id="installing-sesame">Installing Sesame</h3> +<p>We will use current Sesame version 2.7.14. 
You can download it <a href="http://sourceforge.net/projects/sesame/files/Sesame%202/">here</a> or run following command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>wget <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;http://sourceforge.net/projects/sesame/files/Sesame%202/2.7.14/openrdf-sesame-2.7.14-sdk.tar.gz/download&#34;</span> <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> -O openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>Then extract the Sesame tarball:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>tar -xvzf openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>To deploy sesame you have to copy the two war files that are in <em>openrdf-sesame-2.7.14/war</em> to <em>/var/lib/tomcat7/webapps</em></p> +<p>From <em>openrdf-sesame-2.7.14/war</em> you can do it with command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>cp openrdf-*.war &lt;tomcat_install&gt;/webapps +</span></span></code></pre></div><p>Sesame applications write and store configuration files in a single directory and the tomcat server needs permissions for it.</p> +<p>By default the configuration directory is: <em>/usr/share/tomcat7/.aduna</em></p> +<p>Create the directory:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo mkdir /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Then change the ownership:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chown tomcat7 /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>And finally you should give the necessary permissions:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chmod o+rwx /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Now when you go to: http://&lt;your_ip_address&gt;:8080/openrdf-workbench/repositories</p> +<p>You should get a screen like this:</p> +<p><img src="01-Sesame-repo-list.png" alt="image"></p> +<h3 id="setup-spb">Setup SPB</h3> +<p>You can download the SPB code and find brief documentation on GitHub:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm">https://github.com/ldbc/ldbc_spb_bm</a></p> +<p>A detailed documentation is located here:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf">https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf</a></p> +<p>SPB offers many configuration options which control various features of the benchmark e.g.:</p> +<ul> +<li>query mixes</li> +<li>dataset size</li> +<li>loading 
datasets</li> +<li>number of agents</li> +<li>validating results</li> +<li>test conformance to OWL2-RL ruleset</li> +<li>update rate of agents</li> +</ul> +<p>Here we demonstrate how to generate a dataset and execute a simple test<br> +run with it.</p> +<p>First download the SPB source code from the repository:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>git clone https://github.com/ldbc/ldbc_spb_bm.git +</span></span></code></pre></div><p>Then in the ldbc_spb_bm directory build the project:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>ant build-basic-querymix +</span></span></code></pre></div><p>If you simply execute the command:</p> +<pre tabindex="0"><code>ant +</code></pre><p>you’ll get a list of all available build configurations for the SPB test driver, but for the purpose of this step-by-step guide, configuration shown above is sufficient.</p> +<p>Depending on generated dataset size a bigger java heap size may be required for the Sesame Store. You can change it by adding following arguments to Tomcat&rsquo;s startup files e.g. in <em>catalina.sh</em>:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>export JAVA_OPTS<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;-d64 -Xmx4G&#34;</span> +</span></span></code></pre></div><p>To run the Benchmark you need to create a repository in the Sesame Data Store, similar to the following screenshot:</p> +<p><img src="02-Sesame-create-repo.png" alt="image"></p> +<p>Then we need to point the benchmark test driver to the SPARQL endpoint of that repository. 
This is done in <em>ldbc_spb_bm/dist/test.properties</em> file.</p> +<p>The default value of <em>datasetSize</em> in the properties is set to be 10M, but for the purpose of this guide we will decrease it to 1M.</p> +<p>You need to change</p> +<pre tabindex="0"><code>datasetSize=1000000 +</code></pre><p>Also the URLs of the SPARQL endpoint for the repository</p> +<pre tabindex="0"><code>endpointURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1 +endpointUpdateURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1/statements +</code></pre><p>First step, before measuring the performance of a triple store, is to load the reference-knowledge data, generate a 1M dataset, load it into the repository and finally generate query substitution parameters.</p> +<p>These are the settings to do that, following parameters will &lsquo;instruct&rsquo; the SPB test driver to perform all the actions described above:</p> +<pre tabindex="0"><code>#Benchmark Operational Phases +loadOntologies=true +loadReferenceDatasets=true +generateCreativeWorks=true +loadCreativeWorks=true +generateQuerySubstitutionParameters=true +validateQueryResults=false +warmUp=false +runBenchmark=false +runBenchmarkOnlineReplicationAndBackup=false +checkConformance=false +</code></pre><p>To run the benchmark execute the following:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>java -jar semantic_publishing_benchmark-basic-standard.jar +</span></span><span style="display:flex;"><span>test.properties +</span></span></code></pre></div><p>When the initial run has finished, we should have a 1M dataset loaded into the repository and a set of files with query substitution parameters.</p> +<p>Next we will measure the performance of Sesame Data Store by changing some configuration properties:</p> +<pre tabindex="0"><code>#Benchmark Configuration Parameters +warmupPeriodSeconds=60 +benchmarkRunPeriodSeconds=300 +... +#Benchmark Operational Phases +loadOntologies=false +loadReferenceDatasets=false +generateCreativeWorks=false +loadCreativeWorks=false +generateQuerySubstitutionParameters=false +validateQueryResults=false +warmUp=true +runBenchmark=true +runBenchmarkOnlineReplicationAndBackup=false +checkConformance=false +</code></pre><p>After the benchmark test run has finished result files are saved in folder: <em>dist/logs</em></p> +<p>There you will find three types of results: the result summary of the benchmark run (<em>semantic_publishing_benchmark_results.log),</em> brief results and detailed results.</p> +<p>In <em>semantic_publishing_benchmark_results.log</em> you will find the results distributed per seconds. 
They should be similar to the listing bellow:</p> +<p>Benchmark Results for the 300-th second</p> +<pre tabindex="0"><code>Seconds : 300 (completed query mixes : 0) + Editorial: + 2 agents + + 9 inserts (avg : 22484 ms, min : 115 ms, max : 81389 ms) + 0 updates (avg : 0 ms, min : 0 ms, max : 0 ms) + 0 deletes (avg : 0 ms, min : 0 ms, max : 0 ms) + + 9 operations (9 CW Inserts (0 errors), 0 CW Updates (1 errors), 0 CW Deletions (2 errors)) + 0.0300 average operations per second + + Aggregation: + 8 agents + + 2 Q1 queries (avg : 319 ms, min : 188 ms, max : 451 ms, 0 errors) + 3 Q2 queries (avg : 550 ms, min : 256 ms, max : 937 ms, 0 errors) + 1 Q3 queries (avg : 58380 ms, min : 58380 ms, max : 58380 ms, 0 errors) + 2 Q4 queries (avg : 65250 ms, min : 40024 ms, max : 90476 ms, 0 errors) + 1 Q5 queries (avg : 84220 ms, min : 84220 ms, max : 84220 ms, 0 errors) + 2 Q6 queries (avg : 34620 ms, min : 24499 ms, max : 44741 ms, 0 errors) + 3 Q7 queries (avg : 5892 ms, min : 4410 ms, max : 8528 ms, 0 errors) + 2 Q8 queries (avg : 3537 ms, min : 546 ms, max : 6528 ms, 0 errors) + 4 Q9 queries (avg : 148573 ms, min : 139078 ms, max : 169559 ms, 0 errors) +</code></pre><p>This step-by-step guide gave an introduction on how to setup and run the SPB on a Sesame Data Store. Further details can be found in the reference documentation listed above.</p> +<p>If you have any troubles running the benchmark, don&rsquo;t hesitate to comment or use our social media channels.</p> +<p>In a future post we will go through some of the parameters of SPB and check their performance implications.</p> + + + + + Semantic Publishing Instance Matching Benchmark + https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/ + Tue, 30 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/ + <p>The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.</p> +<p>The SPIMBench test cases provide a systematic way for testing the performance of instance matching systems in different settings. 
SPIMBench supports the types of test cases already adopted by existing instance matching benchmarks:</p> +<ul> +<li>value-based test cases based on applying value transformations (e.g., blank character addition and deletion, change of date format, abbreviations, synonyms) on triples relating to given input entity</li> +<li>structure-based test cases characterized by a structural transformation (e.g., different nesting levels for properties, property splitting, aggregation)</li> +</ul> +<p>The novelty of SPIMBench lies in the support for the following semantics-aware test cases defined on the basis of OWL constructs:</p> +<ul> +<li>instance (in)equality (owl:sameAs, owl:differentFrom)</li> +<li>class and property equivalence (owl:equivalentClass, owl:equivalentProperty)</li> +<li>class and property disjointness (owl:disjointWith, owl:AllDisjointClasses, owl:propertyDisjointWith, owl:AllDisjointProperties)</li> +<li>class and property hierarchies (rdfs:subClassOf, rdfs:subPropertyOf)</li> +<li>property constraints (owl:FunctionalProperty, owl:InverseFunctionalProperty)</li> +<li>complex class definitions (owl:unionOf, owl:intersectionOf)</li> +</ul> +<p>SPIMBench uses and extends the ontologies of LDBC&rsquo;s Semantic Publishing Benchmark (SPB) to tackle the more complex schema constructs expressed in terms of OWL. It also extends SPB&rsquo;s data generator to first generate a synthetic source dataset that does not contain any matches, and then to generate matches and non-matches to entities of the source dataset to address the supported transformations and OWL constructs. The data generation process allows the creation of arbitrary large datasets, thus supporting the evaluation of both the scalability and the matching quality of an instance matching system.</p> +<p>Value and structure-based test cases are implemented using the SWING framework <a href="#references">[1]</a> on data and object type properties respectively. These are produced by applying the appropriate transformation(s) on a source instance to obtain a target instance. Semantics-based test cases are produced in the same way as with the value and structure-based test cases with the difference that appropriate triples are constructed and added in the target dataset to consider the respective OWL constructs.</p> +<p>SPIMBench, in addition to the semantics-based test cases that differentiate it from existing instance matching benchmarks, also offers a weighted gold standard used to judge the quality of answers of instance matching systems. It contains generated matches (a pair consisting of an entity of the source dataset and an entity of the target dataset) the type of test case it represents, the property on which a transformation was applied (in the case of value-based and structure-based test cases), and a weight that quantifies how easy it is to detect this match automatically. SPIMBench adopts an information-theoretical approach by applying multi-relational learning to compute the weight of the pair of matched instances by measuring the information loss that results from applying transformations to the source data to generate the target data. 
This detailed information, which is not provided by state of the art benchmarks, allows users of SPIMBench (e.g., developers of IM systems) to more easily identify the reasons underlying the performance results obtained using SPIMBench and thereby supports the debugging of instance matching systems.</p> +<p>SPIMBench can be downloaded from <a href="https://github.com/jsaveta/SPIMBench">our repository</a> and a more thorough description thereof can be found on <a href="http://www.ics.forth.gr/isl/spimbench/">http://www.ics.forth.gr/isl/spimbench/</a>.</p> +<h4 id="references">References</h4> +<p>[1] A. Ferrara, S. Montanelli, J. Noessner, and H. Stuckenschmidt. Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p> + + + + + Further Developments in SNB BI Workload + https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/ + Thu, 18 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/ + <p>We are presently working on the SNB BI workload. Andrey Gubichev of TU Munchen and myself are going through the queries and are playing with two SQL based implementations, one on Virtuoso and the other on Hyper.</p> +<p>As discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.</p> +<p>There are obvious marketing applications for a SNB-like dataset. There are also security related applications, ranging from fraud detection to intelligence analysis. The latter category is significant but harder to approach, as much of the detail of best practice is itself not in the open. In this post, I will outline some ideas discussed over time that might cristallize into a security related section in the SNB BI workload. We invite comments from practitioners for making the business questions more relevant while protecting sensitive details.</p> +<p>Let’s look at what scenarios would fit with the dataset. We have people, different kinds of connections between people, organizations, places and messages. Messages (posts/replies), people and organizations are geo-tagged. Making a finer level of geo-tagging, with actual GPS coordinates, travel itineraries etc, all referring to real places would make the data even more interesting. The geo dimension will be explored separately in a forthcoming post.</p> +<p>One of the first things to appear when approaching the question isthat the analysis of behavior patterns over time is not easily captured in purely declarative queries. For example, temporal sequence of events and the quantity and quality of interactions between players leads to intractably long queries which are hard to understand and debug. Therefore, views and intermediate materializations become increasingly necessary.</p> +<p>Another feature of the scene is that information is never complete. Even if logs are complete for any particular system, there are always possible interactions outside of the system. Therefore we tend to get match scores more then strictly Boolean conditions. Since everybody is related to everybody else via a relative short path, the nature and stremgth of the relationship is key to interpreting its significance.</p> +<p>Since a query consisting of scores and outer joins only is difficult to interpret and optimize, and since the information is seldom complete, some blanks may have to be filled in by guesses. 
The database must therefore contain metadata about this.</p> +<p>An orthogonal aspect to security applications is the access control of the database itself. One might assume that if a data warehouse of analyzable information is put together, the analyst would have access to the entirety of it. This is however not necessarily the case since the information itself and its provenance may fall under different compartments.</p> +<p>So, let’s see how some of these aspects could be captured in the SNB context.</p> +<p>Geography - We materialize a table of travel events, so that an unbroken sequence of posts from the same location (e.g. country) other than the residence of the poster forms a travel event. The posts may have a fine grained position (IP, GPS coordinates of photos) that marks an itinerary. This is already beyond basicSQL, needing a procedure or window functions.</p> +<p>The communication between people is implicit in reply threads and forum memberships. A reply is the closest that one comes to a person to person message in the dataset. Otherwise all content is posted to forumns with more or less participants. Membership in a high traffic forum with few participants would indicate a strong connection. Calculating these time varying connection strengths is a lot of work and a lot of text in queries. Keeping things simple requires materializing a sparse “adjacency cube,” i.e. a relation of person1, person2, time bucket -&gt; connection strength. In the SNB case the connection strength may be derived from reciprocal replies, likes, being in the same forums, knowing each other etc. Selectivity is important, i.e. being in many small forumns together counts for more than being in ones where everybody else also participates.</p> +<p>The behaviors of people in SNB is not identical from person to person but for the same person follows a preset pattern. Suppose a question like “ which person with access to secrets has a marked change of online behavior?” The change would be starting or stopping communication with a given set of people, for example. Think that the spy meets the future spymaster in a public occasion, has a series of exchanges, travels to an atypical destination, then stops all open contact with the spymaster or related individuals. Patterns like this do not occur in the data but can be introduced easily enough.</p> +<p>In John Le Carre’s A Perfect Spy the main character is caught because it comes to light that his travel routes near always corresponded to his controller’s. This would make a query. This could be cast in marketing terms as a “(un)common shopping basket.”</p> +<p>Analytics becomes prediction when one part of a pattern exists without the expected next stage. Thus the same query template can serve for detecting full or partial instances of a pattern, depending on how the scores are interpreted.</p> +<p>From a database angle, these questions group on an item with internal structure. For the shopping basket this is a set. For the travel routes this is an ordered sequence of space/time points, with a match tolerance on the spatial and temporal elements. Another characteristic is that there is a baseline of expectations and the actual behavior. Both have structure, e.g. the occupation/location/interest/age of one’s social circle. These need to be condensed into a sort of metric space and then changes and rates of change can be observed. Again, this calls for a multidimensional cube to be created as a summary, then algorithms to be applied to this. 
The declarative BI query a la TPC-H does not easily capture this all.</p> +<p>This leads us to graph analytics in a broader sense. Some of the questions addressed here will still fit in the materialized summaries+declarative queries pattern but the more complex summarization and clustering moves towards iterative algorithms.</p> +<p>There is at present a strong interest in developing graph analytics benchmarks in LDBC. This is an activity that extends beyond the FP7 project duration and beyond the initial partners. To this effect I have implemented some SQL extensions for BSP style processing, as hinted at on my blog. These will be covered in more detail in January, when there are actual experiments.</p> + + + + + Sizing AWS Instances for the Semantic Publishing Benchmark + https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/ + Wed, 17 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/ + <p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the famous <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">BBC Dynamic Semantic Publishing</a> scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volume of read requests (SPARQL queries collecting recent content and data to generate web page on a specific subject, e.g. Frank Lampard). As we <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">wrote earlier</a>, SPB was already successfully used to help developers to identify performance issues and to introduce optimizations in SPARQL engines such as GraphDB and Virtuoso. Now we are at the point to experiment with different sizes of the benchmark and different hardware configurations.</p> +<p>Lately we tested different Amazon Web Services (<a href="https://aws.amazon.com/">AWS</a>) instance types for running SPB basic interactive query mix in parallel with the standard editorial updates – precisely the type of workload that <a href="https://www.ontotext.com/products/ontotext-graphdb/">GraphDB</a> experiences in the backend of BBC Sport website. We discovered and report below a number of practical guidelines about the optimal instance types and configurations. We have proven that SPB 50M workloads can be executed efficiently on a mid-sized AWS instance – c3.2xlarge machine executes 16 read queries and 15 update operations per second. For $1 paid to Amazon for such instance GraphDB executes 140 000 queries and 120 000 updates. 
The most interesting discovery in this experiment is that if BBC were hosting the triplestore behind their Dynamic Semantic Publishing architecture at AWS, the total cost of the server infrastructure behind their Worldcup 2010 website would have been about $80/day.</p> +<h3 id="the-experiment">The Experiment</h3> +<p>For our tests we use:</p> +<ul> +<li>GraphDB Standard v6.1</li> +<li>LDBC-SPB test driver (version 0.1.dc9a626 from 10.Nov.2014) configured as follows: +<ul> +<li>8 aggregation agents (read threads) and 2 editorial agents (write threads); for some configurations we experimented with different numbers of agents also</li> +<li>50M dataset (SF1)</li> +<li>40 minutes of benchmark run time (60 seconds of warm up)</li> +</ul> +</li> +<li>5 different Amazon EC2 instances and one local server</li> +</ul> +<p>Each test run is cold, i.e. data is newly loaded for each run. We set a 5 GByte cache configuration, which is sufficient for the size of the generated dataset. We use the same query substitution parameters (the same randomization seed) for every run, so that we are sure that all test runs are identical.</p> +<p>We use two types of instances – M3 and C3 instances. They both provide SSD storage for fast I/O performance. The M3 instances are with E5-2670v2, 2.50GHz CPU and provide good all-round performance, while the C3 instances are compute optimized with stronger CPU – E5-2680v2, 2.80GHz, but have half as much memory as the M3.</p> +<p>We also use a local physical server with dual-CPU – E5-2650v2, 2.60Ghz; 256GB of RAM and RAID-0 array of SSD in order to provide ground for interpretation of the performance for the virtualized AWS instances. The CPU capacity of the AWS instances is measured in vCPUs (virtual CPU). A vCPU is a logical core – one hyper-thread of one physical core of the corresponding Intel Xeon processor used by Amazon. This means that a vCPU represents roughly half a physical core, even though the performance of a hyper-threaded core is not directly comparable with two non-hyper-threaded cores. We should keep this in mind comparing AWS instances to physical machines, i.e. our local server with two CPUs with 8 physical cores each has 32 logical cores, which is more than c3.4xlarge instance with 16 vCPUs.</p> +<h3 id="the-results">The Results</h3> +<p>For the tests we measured:</p> +<ul> +<li><em>queries/s</em> for the read threads, where queries include SELECT and CONSTRUCT</li> +<li><em>updates/s</em> for the write threads, where an update operation is INSERT or DELETE</li> +<li><em>queries/$</em> and <em>updates/$</em> – respectively queries or updates per dollar is calculated for each AWS instance type based on price and update throughput</li> +<li><em>update/vCPU</em> – modification operations per vCPU per second</li> +</ul> +<p>Results (Table 1.) provide strong evidence that performance depends mostly on processor power. This applies to both queries and updates - which in the current AWS setup go on par with one another. Comparing M3 and C3 instances with equal vCPUs we can see that performance is only slightly higher for the M3 machines and even lower for selects with 8 vCPUs. 
Taking into account the lower price of C3 because of their lower memory, it is clear that C3 machines are better suited for this type of workload and the sweet spot between price and performance is c3.2xlarge machine.</p> +<p>The improvement in performance between the c3.xlarge and c3.2xlarge is more than twofold where the improvement between c3.2xlarge and c3.4xlarge is considerably lower. We also observe slower growth between c3.4xlarge and the local server machine. This is an indication that for SPB at this scale the difference between 7.5GB and 15GB of RAM is substantial, but RAM above this amount cannot be utilized efficiently by GraphDB.</p> +<p>Table 1. SPB Measurement Results on AWS and Local Servers</p> +<table> +<thead> +<tr> +<th>Server Type</th> +<th>vCPUs</th> +<th>R/W Agents</th> +<th>RAM (GB)</th> +<th>&ldquo;Storage (GB, SSD)&rdquo;</th> +<th>Price USD/h</th> +<th>Queries/ sec.</th> +<th>Updates/ sec.</th> +<th>Queries/ USD</th> +<th>Updates/ USD</th> +<th>Updates/ vCPU</th> +</tr> +</thead> +<tbody> +<tr> +<td>m3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>15</td> +<td>2x 40</td> +<td>0.28</td> +<td>8.39</td> +<td>8.23</td> +<td>107 882</td> +<td>105 873</td> +<td>2.06</td> +</tr> +<tr> +<td>m3.2xlarge</td> +<td>8</td> +<td>8/2</td> +<td>30</td> +<td>2x 80</td> +<td>0.56</td> +<td>15.44</td> +<td>15.67</td> +<td>99 282</td> +<td>100 752</td> +<td>1.96</td> +</tr> +<tr> +<td>c3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>7.5</td> +<td>2x 40</td> +<td>0.21</td> +<td>7.17</td> +<td>6.78</td> +<td>122 890</td> +<td>116 292</td> +<td>1.7</td> +</tr> +<tr> +<td><strong>c3.2xlarge</strong></td> +<td><strong>8</strong></td> +<td><strong>8/2</strong></td> +<td><strong>15</strong></td> +<td><strong>2x 80</strong></td> +<td><strong>0.42</strong></td> +<td><strong>16.46</strong></td> +<td><strong>14.56</strong></td> +<td><strong>141 107</strong></td> +<td><strong>124 839</strong></td> +<td><strong>1.82</strong></td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>8/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>23.23</strong></td> +<td><strong>21.17</strong></td> +<td><strong>99 578</strong></td> +<td><strong>90 736</strong></td> +<td><strong>1.32</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>8/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>22.89</td> +<td>20.39</td> +<td>98 100</td> +<td>87 386</td> +<td>1.27</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/2</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.6</td> +<td>19.11</td> +<td>114 000</td> +<td>81 900</td> +<td>1.19</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.19</td> +<td>19.18</td> +<td>112 243</td> +<td>82 200</td> +<td>1.2</td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>14/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>30.84</strong></td> +<td><strong>16.88</strong></td> +<td><strong>132 171</strong></td> +<td><strong>72 343</strong></td> +<td><strong>1.06</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>14/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>29.67</td> +<td>17.8</td> +<td>127 157</td> +<td>76 286</td> +<td>1.11</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>8/2</td> +<td>256</td> +<td>8x 256</td> 
+<td>0.85</td> +<td>37.11</td> +<td>32.04</td> +<td>156 712</td> +<td>135 302</td> +<td>1</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>8/3</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>37.31</td> +<td>32.07</td> +<td>157 557</td> +<td>135 429</td> +<td>1</td> +</tr> +<tr> +<td><strong>Local</strong></td> +<td><strong>32</strong></td> +<td><strong>10/2</strong></td> +<td><strong>256</strong></td> +<td><strong>8x 256</strong></td> +<td><strong>0.85</strong></td> +<td><strong>40</strong></td> +<td><strong>31.01</strong></td> +<td><strong>168 916</strong></td> +<td><strong>130 952</strong></td> +<td><strong>0.97</strong></td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>14/2</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>36.39</td> +<td>26.42</td> +<td>153 672</td> +<td>111 569</td> +<td>0.83</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>14/3</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>36.22</td> +<td>26.39</td> +<td>152 954</td> +<td>111 443</td> +<td>0.82</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>20/2</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>34.59</td> +<td>23.86</td> +<td>146 070</td> +<td>100 759</td> +<td>0.75</td> +</tr> +</tbody> +</table> +<h3 id="the-optimal-number-of-test-agents">The Optimal Number of Test Agents</h3> +<p>Experimenting with different number of aggregation (read) and editorial (write) agents at c3.4xlarge and the local server, we made some interesting observations:</p> +<ul> +<li>There is almost no benefit to use more than 2 write agents. This can be explained by the fact that certain aspects of handling writes in GraphDB are serialized, i.e. they cannot be executed in parallel across multiple write threads;</li> +<li>Using more read agents can have negative impact on update performance. This is proven by the c3.4xlarge results with 8/2 and with 14/2 agents - while in the later case GraphDB handles a bit higher amount of queries (31 vs. 23) we see a drop in the updates rates (from 21 to 17);</li> +<li>Overall, the configuration with 8 read agents and 2 write agents delivers good balanced results across various hardware configurations;</li> +<li>For machines with more than 16 cores, a configuration like 10/2 or 14/2, would maximize the number of selects, still with good update rates. This way one can get 30 queries/sec. on c3.4xlarge and 40 queries/sec. on a local server;</li> +<li>Launching more than 14 read agents does not help even on local server with 32 logical cores. This indicates that at this point we are reaching some constraints such as memory bandwidth or IO throughput and degree of parallelization.</li> +<li>There is some overhead when handling bigger number of agents as the results for the local server tests with 14/3 and 20/2 show the worst results for both queries and updates.</li> +</ul> +<h3 id="efficiency-and-cost">Efficiency and Cost</h3> +<p>AWS instance type c3.2xlarge provides the best price/performance ratio for applications where 15 updates/sec. are sufficient even at peak times. 
More intensive applications should use type c3.4xlarge, which guarantees more than 20 updates/sec.</p> +<p>Cloud infrastructure providers like Amazon, allow one to have a very clear account of the full cost for the server infrastructure, including hardware, hosting, electricity, network, etc.</p> +<p>$1 spent on c3.2xlarge ($0.41/hour) allows for handling 140 000 queries, along with more than 120 000 update operations!</p> +<p>The full cost of the server infrastructure is harder to compute in the case of purchasing a server and hosting it in a proprietary data center. Still, one can estimate the upper limits - for machine, like the local server used in this benchmark, this price is way lower than $1/hour. One should consider that this machine is with 256GB of RAM, which is an overkill for Semantic Publishing Benchmark ran at 50M scale. Under all these assumptions we see that using local server is cheaper than the most cost-efficient AWS instance. This is expected - owning a car is always cheaper than renting it for 3 years in a row. Actually, the fact that the difference of the prices/query in this case are low indicates that using AWS services comes at very low extra cost.</p> +<p>To put these figures in the context of a known real world application, let us model the case of a GraphDB Enterprise replication cluster with 2 master nodes and 6 worker nodes - the size of cluster that BBC used for their FIFA Worldcup 2010 project. Given c3.2xlarge instance type, the math works as follows:</p> +<ul> +<li><strong>100 queries/sec.</strong> handled by the cluster. This means about 360 000 queries per hour or more than 4 million queries per day. This is at least 2 times more than the actual loads of GraphDB at BBC during the peak times of big sports events.</li> +<li><strong>10 updates/sec.</strong> - the speed of updates in GraphDB Enterprise cluster is lower than the speed of each worker node in separation. There are relatively few content management applications that need more than 36 000 updates per hour.</li> +<li><strong>$81/day</strong> is the full cost for the server infrastructure. This indicates an annual operational cost for cluster of this type in the range of $30 000, even without any effort to release some of the worker nodes in non-peak times.</li> +</ul> + + + + + DATAGEN: a Realistic Social Network Data Generator + https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/ + Sat, 06 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/ + <p>In previous posts (<a href="https://ldbcouncil.org/post/getting-started-with-snb">Getting started with snb</a>, <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">DATAGEN: data generation for the Social Network Benchmark</a>), Arnau Prat discussed the main features and characteristics of DATAGEN: <em>realism</em>, <em>scalability</em>, <em>determinism</em>, <em>usability</em>. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity in a social network site during a period of time. In this post, we conduct a series of experiments that will shed some light on how realistic data produced by DATAGEN looks. 
For our testing, we generated a dataset of scale factor 10 (i.e., social network of 73K users during 3 years) and loaded it into Virtuoso by following the <a href="https://github.com/ldbc/ldbc_snb_datagen">instructions for generating a SNB dataset</a> and <a href="https://github.com/ldbc/ldbc_snb_implementations/tree/master/interactive/virtuoso">for loading the dataset into Virtuoso</a>. In the following sections, we analyze several aspects of the generated dataset.</p> +<h3 id="a-realistic-social-graph">A Realistic social graph</h3> +<p>One of the most complexly structured graphs that can be found in the data produced by DATAGEN is the friends graph, formed by people and their <em><knows></em> relationships. We used the R script after Figure 1 to draw the social degree distribution in the SNB friends graph. As shown in Figure 1, the cumulative social degree distribution of the friends graph is similar to that from Facebook (See the note about <a href="https://www.facebook.com/notes/facebook-data-team/anatomy-of-facebook/10150388519243859">Facebook Anatomy</a>). This is not by chance, as DATAGEN has been designed to deliberately reproduce the Facebook&rsquo;s graph distribution.</p> +<p><img src="Cumulative-distribution.png" alt="image"> <br> +Figure 1: Cumulative distribution #friends per user</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-r" data-lang="r"><span style="display:flex;"><span><span style="color:#75715e">#R script for generating the social degree distribution </span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">#Input files: person_knows_person_*.csv</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(data.table) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(igraph) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(plotrix) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">require</span>(bit64) +</span></span><span style="display:flex;"><span>dflist <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">lapply</span>(<span style="color:#a6e22e">commandArgs</span>(trailingOnly <span style="color:#f92672">=</span> <span style="color:#66d9ef">TRUE</span>), fread, sep<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;|&#34;</span>, +</span></span><span style="display:flex;"><span> header<span style="color:#f92672">=</span>T, select<span style="color:#f92672">=</span><span style="color:#ae81ff">1</span><span style="color:#f92672">:</span><span style="color:#ae81ff">2</span>, colClasses<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;integer64&#34;</span>) +</span></span><span style="display:flex;"><span> df <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">rbindlist</span>(dflist) <span style="color:#a6e22e">setNames</span>(df, <span style="color:#a6e22e">c</span>(<span style="color:#e6db74">&#34;P1&#34;</span>, <span style="color:#e6db74">&#34;P2&#34;</span>)) +</span></span><span style="display:flex;"><span>d2 <span style="color:#f92672">&lt;-</span> df[,<span style="color:#a6e22e">length</span>(P2),by<span style="color:#f92672">=</span>P1] +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">pdf</span>(<span 
style="color:#e6db74">&#34;socialdegreedist.pdf&#34;</span>) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">plot</span>(<span style="color:#a6e22e">ecdf</span>(d2<span style="color:#f92672">$</span>V1),main<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Cummulative distribution #friends per user&#34;</span>, +</span></span><span style="display:flex;"><span> xlab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Number of friends&#34;</span>, ylab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Percentage number of users&#34;</span>, log<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;x&#34;</span>, +</span></span><span style="display:flex;"><span> xlim<span style="color:#f92672">=</span><span style="color:#a6e22e">c</span>(<span style="color:#ae81ff">0.8</span>, <span style="color:#a6e22e">max</span>(d2<span style="color:#f92672">$</span>V1) <span style="color:#f92672">+</span> <span style="color:#ae81ff">20</span>)) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">dev.off</span>() +</span></span></code></pre></div><h3 id="data-correlations">Data Correlations</h3> +<p>Data in real life as well as in a real social network is correlated; e.g. names of people living in Germany have a different distribution than those living in Netherlands, people who went to the same university in the same period have a much higher probability to be friends and so on and so forth. In this experiment we will analyze if data produced by DATAGEN also reproduces these phenomena.</p> +<p><em>Which are the most popular names of a country?</em></p> +<p>We run the following query on the database built in Virtuoso, which computes the distribution of the names of the people for a given country. In this query, <em>&lsquo;A_country_name&rsquo;</em> is the name of a particular country such as <em>&lsquo;Germany&rsquo;, &lsquo;Netherlands&rsquo;, or &lsquo;Vietnam&rsquo;</em>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> p_lastname, <span style="color:#66d9ef">count</span> (p_lastname) <span style="color:#66d9ef">as</span> namecnt +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">FROM</span> person, country +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> p_placeid <span style="color:#f92672">=</span> ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;A_country_name&#39;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> p_lastname <span style="color:#66d9ef">order</span> <span style="color:#66d9ef">by</span> namecnt <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we can see from Figures 2, 3, and 4, the distributions of names in Germany, Netherlands and Vietnam are different. A name that is popular in Germany such as <em>Muller</em> is not popular in the Netherlands, and it even does not appear in the names of people in Vietnam. 
We note that the names&rsquo; distribution may not be exactly the same as the contemporary names&rsquo; distribution in these countries, since the names resource files used in DATAGEN are extracted from Dbpedia, which may contain names from different periods of time.</p> +<p><img src="distribution-germany.png" alt="image"> <br> +Figure 2. Distribution of names in Germany</p> +<p><img src="distribution-netherlands.png" alt=""> <br> +Figure 3. Distribution of names in Netherlands</p> +<p><img src="distribution-vietnam.png" alt=""> <br> +Figure 4. Distribution of names in Vietnam</p> +<p><em>Where my friends are living?</em></p> +<p>We run the following query, which computes the locations of the friends of people living in China.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> fctry.ctry_name, <span style="color:#66d9ef">count</span> (<span style="color:#f92672">*</span>) <span style="color:#66d9ef">from</span> person <span style="color:#66d9ef">self</span>, person +</span></span><span style="display:flex;"><span>friend, country pctry, knows, country fctry +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> pctry.ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;China&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> <span style="color:#66d9ef">self</span>.p_placeid <span style="color:#f92672">=</span> pctry.ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> <span style="color:#66d9ef">self</span>.p_personid <span style="color:#66d9ef">and</span> friend.p_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> fctry.ctry_city <span style="color:#f92672">=</span> friend.p_placeid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> fctry.ctry_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As shown in the graph, most of the friends of people living in China are also living in China. The rest comes predominantly from near-by countries such as India, Vietnam.</p> +<p><img src="chinese-friends.png" alt=""> <br> +Figure 5. 
Locations of friends of people in China</p> +<p><em>Where my friends are studying?</em></p> +<p>Finally, we run the following query to find where the friends of people studying at a specific university (e.g., “Hangzhou_International_School”) are studying at.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> o2.o_name, <span style="color:#66d9ef">count</span>(o2.o_name) <span style="color:#66d9ef">from</span> knows, person_university +</span></span><span style="display:flex;"><span>p1, person_university p2, organisation o1, organisation o2 +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> +</span></span><span style="display:flex;"><span> p1.pu_organisationid <span style="color:#f92672">=</span> o1.o_organisationid +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> o1.o_name<span style="color:#f92672">=</span><span style="color:#e6db74">&#39;Hangzhou_International_School&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> p1.pu_personid <span style="color:#66d9ef">and</span> p2.pu_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> p2.pu_organisationid <span style="color:#f92672">=</span> o2.o_organisationid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> o2.o_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we see from Figure 6, most of the friends of the Hangzhou International School students also study at that university. This is a realistic correlation, as people studying at the same university have a much higher probability to be friends. Furthermore, top-10 universities for the friends of the Hangzhou School students’ are from China, while people from foreign universities have small number of friends that study in Hangzhou School (See Table 1).</p> +<p><img src="friends-international-school.png" alt=""> <br> +Figure 6. Top-10 universities where the friends of Hangzhou International School students are studying at.</p> +<table> +<thead> +<tr> +<th>Name</th> +<th># of friends</th> +</tr> +</thead> +<tbody> +<tr> +<td>Hangzhou_International_School</td> +<td>12696</td> +</tr> +<tr> +<td>Anhui_University_of_Science_and_Technology</td> +<td>4071</td> +</tr> +<tr> +<td>China_Jiliang_University</td> +<td>3519</td> +</tr> +<tr> +<td>&hellip;</td> +<td></td> +</tr> +<tr> +<td>Darmstadt_University_of_Applied_Sciences</td> +<td>1</td> +</tr> +<tr> +<td>Calcutta_School_of_Tropical_Medicine</td> +<td>1</td> +</tr> +<tr> +<td>Chettinad_Vidyashram</td> +<td>1</td> +</tr> +<tr> +<td>Women&rsquo;s_College_Shillong</td> +<td>1</td> +</tr> +<tr> +<td>Universitas_Nasional</td> +<td>1</td> +</tr> +</tbody> +</table> +<p>Table 1. Universities where friends of Hangzhou International School students are studying at.</p> +<p>In a real social network, data is riddled with many more correlations; it is a true data mining task to extract these. 
Even though DATAGEN may not be able to model all the real life data correlations, it can generate a dataset that reproduce many of those important characteristics found in a real social network, and additionally introduce a series of plausible correlations in it. More and more interesting data correlations may also be found from playing with the SNB generated data.</p> + + + + + SNB Driver - Part 1 + https://ldbcouncil.org/post/snb-driver-part-1/ + Thu, 27 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-1/ + <p>In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as driver). Software and documentation for this driver is available here: <a href="https://github.com/ldbc/ldbc_driver/">https://github.com/ldbc/ldbc_driver/</a>. Multiple reference implementations by two vendors are available here: <a href="https://github.com/ldbc/ldbc_snb_implementations">https://github.com/ldbc/ldbc_snb_implementations</a>, and discussion of the schema, data properties, and related content is available here: <a href="https://github.com/ldbc/ldbc_snb_docs">https://github.com/ldbc/ldbc_snb_docs</a>.</p> +<p>The following will concentrate on key decisions and techniques that were developed to support scalable, repeatable, distributed workload execution.</p> +<h3 id="problem-description">Problem Description</h3> +<p>The driver generates a stream of operations (e.g. create user, create post, create comment, retrieve person&rsquo;s posts etc.) and then executes them using the provided database connector. To be capable of generating heavier loads, it executes the operations from this stream in parallel. If there were no dependencies between operations (e.g., reads that depend on the completion of writes) this would be trivial. This is the case, for example, for the classical TPC-C benchmark, where splitting transaction stream into parallel clients (terminals) is trivial. However, for LDBC SNB Interactive Workload this is not the case: some operations within the stream do depend on others, others are depended on, some both depend on others and are depended on, and some neither depend on others nor are they depended on.</p> +<p>Consider, for example, a Social Network Benchmark scenario, where the data generator outputs a sequence of events such as User A posted a picture, User B left a comment to the picture of User A, etc. The second event depends on the first one in a sense that there is a causal ordering between them: User B can only leave a comment on the picture once it has been posted. The generated events are already ordered by their time stamp, so in case of the single-threaded execution this ordering is observed by default: the driver issues a request to the SUT with the first event (i.e., User A posts a picture), after its completion it issues the second event (create a comment). However, if events are executed in parallel, these two events may end up in different parallel sequences of events. 
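+</p>
+<p>For illustration, here is a minimal sketch in Python of one way such an ordering can be enforced. This is an illustration only, not the actual ldbc_driver implementation, and the operation fields id and depends_on are hypothetical: a worker may only issue an operation once the operation it causally depends on has completed, regardless of which parallel stream the two operations were assigned to.</p>
+<pre tabindex="0"><code># Minimal sketch (not the actual ldbc_driver code) of dependency tracking
+# when an operation stream is executed by several workers in parallel.
+# op.id and op.depends_on are hypothetical fields: depends_on names the
+# operation that must complete before op may start (None if independent).
+import threading
+
+completed = set()            # ids of operations that have finished
+cv = threading.Condition()
+
+def execute(op, run_against_sut):
+    with cv:
+        # Block this worker until the operation that op depends on has
+        # completed, no matter which parallel stream it was assigned to.
+        cv.wait_for(lambda: op.depends_on is None or op.depends_on in completed)
+    run_against_sut(op)      # issue the operation to the System Under Test
+    with cv:
+        completed.add(op.id) # release any operations waiting on this one
+        cv.notify_all()
+</code></pre><p>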
Therefore, a driver needs a mechanism to ensure the dependency is observed even when the dependent events are in different parallel update streams.</p> +<p>The next blog entries in this series will discuss the approaches used in the driver to deal with these challenges.</p> + + + + + Making Semantic Publishing Execution Rules + https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/ + Tue, 18 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/ + <p><a href="https://ldbcouncil.org/">LDBC</a> <a href="https://ldbcouncil.org/benchmarks/spb">SPB (Semantic Publishing Benchmark)</a> is based on the BBC linked data platform use case. Thus the data modelling and transaction mix reflects the BBC&rsquo;s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an <a href="https://www.ontotext.com/products/ontotext-graphdb-owlim/">Ontotext Graph DB</a> deployment. Graph DB was formerly known as Owlim.</p> +<p>So, in SPB we wanted to address substantially more complex queries than the lookups that the BBC linked data platform primarily serves. Diverse dataset summaries, timelines and faceted search qualified by keywords and/or geography are examples of online user experience that SPB needs to cover.</p> +<p>SPB is not per se an analytical workload but we still find that the queries fall broadly in two categories:</p> +<ul> +<li> +<p>Some queries are centred on a particular search or entity. The data touched by the query size does not grow at the same rate as the dataset.</p> +</li> +<li> +<p>Some queries cover whole cross sections of the dataset, e.g. find the most popular tags across the whole database.</p> +</li> +</ul> +<p>These different classes of questions need to be separated in a metric, otherwise the short lookup dominates at small scales and the large query at large scales.</p> +<p>Another guiding factor of SPB was the BBC&rsquo;s and others&rsquo; express wish to cover operational aspects such as online backups, replication and fail-over in a benchmark. True, most online installations have to deal with these things, which are yet as good as absent from present benchmark practice. We will look at these aspects in a different article, for now, I will just discuss the matter of workload mix and metric.</p> +<p>Normally the lookup and analytics workloads are divided into different benchmarks. Here we will try something different. There are three things the benchmark does:</p> +<ul> +<li> +<p>Updates - These sometimes insert a graph, sometimes delete and re-insert the same graph, sometimes just delete a graph. These are logarithmic to data size.</p> +</li> +<li> +<p>Short queries - These are lookups that most often touch on recent data and can drive page impressions. These are roughly logarithmic to data scale.</p> +</li> +<li> +<p>Analytics - These cover a large fraction of the dataset and are roughly linear to data size.</p> +</li> +</ul> +<p>A test sponsor can decide on the query mix within certain bounds. A qualifying run must sustain a minimum, scale-dependent update throughput and must execute a scale-dependent number of analytical query mixes or run for a scale-dependent duration. The minimum update rate, the minimum number of analytics mixes and the minimum duration all grow logarithmically to data size. Within these limits, the test sponsor can decide how to mix the workloads. Publishing several results, emphasizing different aspects is also possible. 
A given system may be specially good at one aspect, leading the test sponsor to accentuate this.</p> +<p>The benchmark has been developed and tested at small scales, between 50 and 150M triples. Next we need to see how it actually scales. There we expect to see how the two query sets behave differently. One effect that we see right away when loading data is that creating the full text index on the literals is in fact the longest running part. For a SF 32 ( 1.6 billion triples) SPB database we have the following space consumption figures:</p> +<ul> +<li> +<p>46886 MB of RDF literal text</p> +</li> +<li> +<p>23924 MB of full text index for RDF literals</p> +</li> +<li> +<p>23598 MB of URI strings</p> +</li> +<li> +<p>21981 MB of quads, stored column-wise with default index scheme</p> +</li> +</ul> +<p>Clearly, applying column-wise compression to the strings is the best move for increasing scalability. The literals are individually short, so literal per literal compression will do little or nothing but applying this by the column is known to get a 2x size reduction with Google Snappy. The full text index does not get much from column store techniques, as it already consists of words followed by space efficient lists of word positions. The above numbers are measured with Virtuoso column store, with quads column wise and the rest row-wise. Each number includes the table(s) and any extra indices associated to them.</p> +<p>Let&rsquo;s now look at a full run at unit scale, i.e. 50M triples.</p> +<p>The run rules stipulate a minimum of 7 updates per second. The updates are comparatively fast, so we set the update rate to 70 updates per second. This is seen not to take too much CPU. We run 2 threads of updates, 20 of short queries and 2 of long queries. The minimum run time for the unit scale is 10 minutes, so we do 10 analytical mixes, as this is expected to take 10 a little over 10 minutes. The run stops by itself when the last of the analytical mixes finishes.</p> +<p>The interactive driver reports:</p> +<pre tabindex="0"><code>Seconds run : 2144 + Editorial: + 2 agents + + 68164 inserts (avg : 46 ms, min : 5 ms, max : 3002 ms) + 8440 updates (avg : 72 ms, min : 15 ms, max : 2471 ms) + 8539 deletes (avg : 37 ms, min : 4 ms, max : 2531 ms) + + 85143 operations (68164 CW Inserts (98 errors), 8440 CW Updates (0 errors), 8539 CW Deletions (0 errors)) + 39.7122 average operations per second + + Aggregation: + 20 agents + + 4120 Q1 queries (avg : 789 ms, min : 197 ms, max : 6767 ms, 0 errors) + 4121 Q2 queries (avg : 85 ms, min : 26 ms, max : 3058 ms, 0 errors) + 4124 Q3 queries (avg : 67 ms, min : 5 ms, max : 3031 ms, 0 errors) + 4118 Q5 queries (avg : 354 ms, min : 3 ms, max : 8172 ms, 0 errors) + 4117 Q8 queries (avg : 975 ms, min : 25 ms, max : 7368 ms, 0 errors) + 4119 Q11 queries (avg : 221 ms, min : 75 ms, max : 3129 ms, 0 errors) + 4122 Q12 queries (avg : 131 ms, min : 45 ms, max : 1130 ms, 0 errors) + 4115 Q17 queries (avg : 5321 ms, min : 35 ms, max : 13144 ms, 0 errors) + 4119 Q18 queries (avg : 987 ms, min : 138 ms, max : 6738 ms, 0 errors) + 4121 Q24 queries (avg : 917 ms, min : 33 ms, max : 3653 ms, 0 errors) + 4122 Q25 queries (avg : 451 ms, min : 70 ms, max : 3695 ms, 0 errors) + + 22.5239 average queries per second. 
Pool 0, queries [ Q1 Q2 Q3 Q5 Q8 Q11 Q12 Q17 Q18 Q24 Q25 ] + + 45318 total retrieval queries (0 timed-out) + 22.5239 average queries per second +</code></pre><p>The analytical driver reports:</p> +<pre tabindex="0"><code>Aggregation: + 2 agents + + 14 Q4 queries (avg : 9984 ms, min : 4832 ms, max : 17957 ms, 0 errors) + 12 Q6 queries (avg : 4173 ms, min : 46 ms, max : 7843 ms, 0 errors) + 13 Q7 queries (avg : 1855 ms, min : 1295 ms, max : 2415 ms, 0 errors) + 13 Q9 queries (avg : 561 ms, min : 446 ms, max : 662 ms, 0 errors) + 14 Q10 queries (avg : 2641 ms, min : 1652 ms, max : 4238 ms, 0 errors) + 12 Q13 queries (avg : 595 ms, min : 373 ms, max : 1167 ms, 0 errors) + 12 Q14 queries (avg : 65362 ms, min : 6127 ms, max : 136346 ms, 2 errors) + 13 Q15 queries (avg : 45737 ms, min : 12698 ms, max : 59935 ms, 0 errors) + 13 Q16 queries (avg : 30939 ms, min : 10224 ms, max : 38161 ms, 0 errors) + 13 Q19 queries (avg : 310 ms, min : 26 ms, max : 1733 ms, 0 errors) + 12 Q20 queries (avg : 13821 ms, min : 11092 ms, max : 15435 ms, 0 errors) + 13 Q21 queries (avg : 36611 ms, min : 14164 ms, max : 70954 ms, 0 errors) + 13 Q22 queries (avg : 42048 ms, min : 7106 ms, max : 74296 ms, 0 errors) + 13 Q23 queries (avg : 48474 ms, min : 18574 ms, max : 93656 ms, 0 errors) + 0.0862 average queries per second. Pool 0, queries [ Q4 Q6 Q7 Q9 Q10 Q13 Q14 Q15 Q16 Q19 Q20 Q21 Q22 Q23 ] + + 180 total retrieval queries (2 timed-out) + 0.0862 average queries per second +</code></pre><p>The metric would be 22.52 qi/s, 310 qa/h, 39.7 u/s @ 50Mt (SF 1)</p> +<p>The SUT is dual Xeon E5-2630, all in memory. The platform utilization is steadily above 2000% CPU (over 20/24 hardware threads busy on the DBMS). The DBMS is Virtuoso open source, (<a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack at github.com</a>, <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics</a>).</p> +<p>The minimum update rate of 7/s was sustained but fell short of the target of 70./s. In this run, most demand was put on the interactive queries. Different thread allocations would give different ratios of the metric components. The analytics mix is for example about 3x faster without other concurrent activity.</p> +<p>Is this good or bad? I would say that this is possible but better can certainly be accomplished.</p> +<p>The initial observation is that Q17 is the worst of the interactive lot. 3x better is easily accomplished by avoiding a basic stupidity. The query does the evil deed of checking for a substring in a URI. This is done in the wrong place and accounts for most of the time. The query is meant to test geo retrieval but ends up doing something quite different. Optimizing this right would almost double the interactive score. There are some timeouts in the analytical run, which as such disqualifies the run. This is not a fully compliant result but is close enough to give an idea of the dynamics. So we see that the experiment is definitely feasible, is reasonably defined and that the dynamics seen make sense.</p> +<p>As an initial comment of the workload mix, I&rsquo;d say that interactive should have a few more very short point lookups to stress compilation times and give a higher absolute score of queries per second.</p> +<p>Adjustments to the mix will depend on what we find out about scaling. 
As with SNB, it is likely that the workload will shift a little, so this result might not be comparable with future ones.</p> +<p>In the next SPB article, we will look closer at performance dynamics and choke points and will have an initial impression on scaling the workload.</p> + + + + + Fifth TUC Meeting + https://ldbcouncil.org/event/fifth-tuc-meeting/ + Fri, 14 Nov 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fifth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce its fifth Technical User<br> +Community (TUC) meeting.</p> +<p>This will be a one-day event at the National Hellenic Research Institute<br> +in Athens, Greece on <strong>Friday November 14, 2014</strong>.</p> +<h3 id="agenda">Agenda</h3> +<p>10:30 - 11:00 Coffee Break</p> +<p>11:00 - 11:10 Peter Boncz (VUA) Welcome &amp; LDBC project status update (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979841.pptx">Presentation</a>)</p> +<p>11:10 - 11:25 Venelin Kotsev (ONTO) Semantic Publishing Benchmark:Short Presentation of SPB and Status</p> +<p>Feedback &amp; Roadmap for SPB &amp; OWLIM (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979839.pdf">Presentation</a>)</p> +<p>11:25 - 11:30 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SPB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979828.pdf">Presentation</a>)</p> +<p>11:30 - 11:45 Alex Averbuch (NEO) Social Network Benchmark: Short Presentation of SNB and Status, Feedback &amp; Roadmap for SNB &amp; Neo4J (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979830.pdf">Presentation</a>)</p> +<p>11:45 - 12:00 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SNB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979829.pdf">Presentation</a>)</p> +<p>12:00 - 12:20 Arnau Prat (UPC) &amp; Andrey Gubichev Status, Feedback &amp; Roadmap for SNB Interactive &amp; Sparksee (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979836.pdf">Presentation</a> ) and Business Intelligence (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979837.pdf">Presentation</a>)</p> +<p>12:20 - 12:40 Tomer Sagi, &ldquo;Experience with SNB and TitanDB at HP&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979838.pptx">Presentation</a> )</p> +<p>12:40 - 13:00 Jakob Nelson, &ldquo;graphbench.org on the SNB datagen&rdquo;</p> +<p>13:00 - 14:30 Lunch Break@Byzantine &amp; Christian Museum (<a href="http://www.byzantinemuseum.gr/en/">link</a>)</p> +<p>14:30 - 14:50 Olaf Hartig, &ldquo;Integrating the Property Graph and RDF data models&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979831.pdf">Presentation</a>)\</p> +<p>Documents: <a href="http://arxiv.org/abs/1409.3288">arxiv/1409.3288</a>, <a href="http://arxiv.org/abs/1406.3399">arxiv/1406.3399</a></p> +<p>14:50 - 15:10 Maria-Esther Vidal and Maribel Acosta, &ldquo;Challenges to be addressed during Benchmarking SPARQL Federated Engines&rdquo; (<a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979842.pdf">Presentation</a>)</p> +<p>15:10 - 15:30 Evaggelia Pitoura, &ldquo;Historical Queries on Graphs&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979835.pdf">Presentation</a>)</p> +<p>15:30 - 16:00 Coffee Break</p> +<p>16:00 - 16:20 Manolis Terrovitis, Giannis Liagos, George Papastefanatos, &ldquo;Efficient Identification of Implicit Facts in Incomplete OWL2-EL Knowledge Bases&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979843.pdf">Presentation</a>)</p> +<p>16:20 - 16:40 Gunes Aluc, &ldquo;WatDiv: How to Tune-up your RDF Data Management System&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979832.pdf">Presentation</a>)</p> +<p>16:40 - 17:00 Giorgos Kollias, Yannis Smaragdakis, &ldquo;Benchmarking @LogicBlox&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979840.pdf">Presentation</a>)</p> +<p>17:00 - 17:15 Hassan Chafi, &ldquo;Oracle Labs Graph Strategy&rdquo;</p> +<p>17:15 - 17:25 Yinglong Xia, &ldquo;Property Graphs for Industry Solution at IBM&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979834.pdf">Presentation</a>)</p> +<p>17:25 - 17:30 Arthur Keen, &ldquo;Short Introduction to SPARQLcity&rdquo;</p> +<p><em><strong>20:30 Dinner @ Konservokouti <a href="https://plus.google.com/114240752029716758955/about?gl=gr&amp;hl=en">(link)</a></strong></em></p> +<p><em><strong>Get a Taxi, and go to Ippokratous 148, Athens, Neapoli Exarheion</strong></em></p> +<h4 id="logistics">Logistics</h4> +<p>The meeting will be held at the <a href="http://www.eie.gr/index-en.html">National Hellenic Research Foundation</a> located in <a href="http://www.eie.gr/location-en.html">downtown Athens</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/5964344.gif" alt=""></p> +<h4 id="travel">Travel</h4> +<p>Athens, Greece&rsquo;s capital city, is easily accessible by air. Travelers on flights to Athens will land at Athens Eleftherios Venizelos International Airport.</p> +<p>To arrive in the city center, you can take the metro from the airport (Line #3) and stop at either stop Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations. You can also take express Bus X95 and stop again at either Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations (the latter is the terminus for the bus).</p> +<p>You can also take a taxi from the airport that runs on a fixed price for the city center (45 euros). More information on how to move around in Athens from the airport can be found here: <a href="http://www.aia.gr/traveler/">http://www.aia.gr/traveler/</a></p> + + + + + Getting Started With the Semantic Publishing Benchmark + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + Sun, 09 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + <p>The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. 
It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies proposed by the BBC that define numerous properties for content; they contain all RDFS schema constructs and certain OWL ones.</p> +<p>The benchmark proposes a data generator that uses the ontologies and reference datasets provided by the BBC to produce a set of valid instances; it works with a predefined set of distributions derived from the reference datasets. In addition to these distributions, the data generator also models:</p> +<ul> +<li>clustering of creative works around certain entities from the reference datasets (e.g. the association of an entity with creative works would decay exponentially in time)</li> +<li>correlations between entities - there will be creative works about two entities for a certain period in time, so that a history of interactions is also modelled (e.g. J. Biden and B. Obama are tagged in creative works for a continuous period in time)</li> +</ul> +<p>The driver proposed by the benchmark measures the performance of CRUD operations against a SPARQL endpoint by starting a number of concurrently running editorial and aggregation agents. The former execute a series of insert, update and delete operations, whereas the latter execute a set of construct, describe and select queries against the SPARQL endpoint. The benchmark can access any SPARQL endpoint that supports the SPARQL 1.1 protocol. Tests have been run on OWLIM and Virtuoso; attempts were also made with Stardog.</p> +<p>Currently, the benchmark offers two workloads: a base version that consists of a mix of nine queries of different complexity covering nearly all the features of the SPARQL 1.1 query language, including sorting, subqueries, limit, regular expressions and grouping. 
The queries aim at checking different choke points relevant to query optimisation such as:</p> +<ul> +<li>join ordering based on cardinality constraints - expressed by the different kinds of properties defined in the schema</li> +<li>subselects that aggregate the query results that the optimiser should recognise and evaluate first</li> +<li>optional and nested optional clauses where the optimiser is called to produce a plan where the execution of the optional triple patterns is performed last</li> +<li>reasoning along the RDFS constructs (subclass, subproperty hierarchies, functional, object and transitive properties etc.)</li> +<li>unions to be executed in parallel</li> +<li>optionals that contain filter expressions that should be executed as early as possible in order to eliminate intermediate results</li> +<li>ordering where the optimiser could consider the possibility to choose query plan(s) that facilitate the ordering of results</li> +<li>handling of geo-spatial predicates</li> +<li>full-text search optimisation</li> +<li>asynchronous execution of the aggregate sub-queries</li> +<li>use of distinct to choose the optimal query plan</li> +</ul> +<p>We give below Query 1 of the Semantic Publishing Benchmark.</p> +<pre tabindex="0"><code>PREFIX bbcevent:&lt;http://www.bbc.co.uk/ontologies/event/&gt; +PREFIX geo-pos:&lt;http://www.w3.org/2003/01/geo/wgs84_pos#&gt; +PREFIX bbc:&lt;http://www.bbc.co.uk/ontologies/bbc/&gt; +PREFIX time:&lt;http://www.w3.org/2006/time#&gt; +PREFIX event:&lt;http://purl.org/NET/c4dm/event.owl#&gt; +PREFIX music-ont:&lt;http://purl.org/ontology/mo/&gt; +PREFIX rdf:&lt;http://www.w3.org/1999/02/22-rdf-syntax-ns#&gt; +PREFIX foaf:&lt;http://xmlns.com/foaf/0.1/&gt; +PREFIX provenance:&lt;http://www.bbc.co.uk/ontologies/provenance/&gt; +PREFIX owl:&lt;http://www.w3.org/2002/07/owl#&gt; +PREFIX cms:&lt;http://www.bbc.co.uk/ontologies/cms/&gt; +PREFIX news:&lt;http://www.bbc.co.uk/ontologies/news/&gt; +PREFIX cnews:&lt;http://www.bbc.co.uk/ontologies/news/cnews/&gt; +PREFIX cconcepts:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX dbp-prop:&lt;http://dbpedia.org/property/&gt; +PREFIX geonames:&lt;http://sws.geonames.org/&gt; +PREFIX rdfs:&lt;http://www.w3.org/2000/01/rdf-schema#&gt; +PREFIX domain:&lt;http://www.bbc.co.uk/ontologies/domain/&gt; +PREFIX dbpedia:&lt;http://dbpedia.org/resource/&gt; +PREFIX geo-ont:&lt;http://www.geonames.org/ontology#&gt; +PREFIX bbc-pont:&lt;http://purl.org/ontology/po/&gt; +PREFIX tagging:&lt;http://www.bbc.co.uk/ontologies/tagging/&gt; +PREFIX sport:&lt;http://www.bbc.co.uk/ontologies/sport/&gt; +PREFIX skosCore:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX dbp-ont:&lt;http://dbpedia.org/ontology/&gt; +PREFIX xsd:&lt;http://www.w3.org/2001/XMLSchema#&gt; +PREFIX core:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX curric:&lt;http://www.bbc.co.uk/ontologies/curriculum/&gt; +PREFIX skos:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX cwork:&lt;http://www.bbc.co.uk/ontologies/creativework/&gt; +PREFIX fb:&lt;http://rdf.freebase.com/ns/&gt; + +# Query Name : query1 +# Query Description : +# Retrieve creative works about thing t (or that mention t) +# reasoning: rdfs:subClassOf, rdf:type +# join ordering: cwork:dateModified rdf:type owl:FunctionalProperty +# join ordering: cwork:dateCreated rdf:type owl:FunctionalProperty +# Choke Points : +# - join ordering based on cardinality of functional proerties cwork:dateCreated, cwork:dateModified +# Optimizer should use an efficient cost evaluation method 
for choosing the optimal join tree +# - A sub-select which aggregates results. Optimizer should recognize it and execute it first +# - OPTIONAL and nested OPTIONAL clauses (treated by query optimizer as nested sub-queries) +# Optimizer should decide to put optional triples on top of the join tree +# (i.e. delay their execution to the last possible moment) because OPTIONALs are treated as a left join +# - qiery optimizer has the chance to recognize the triple pattern : ?cWork a ?type . ?type rdfs:subClassOf cwork:CreativeWork +# and eliminate first triple (?cwork a ?type .) since ?cwork is a cwork:CreativeWork​ + +CONSTRUCT { + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:shortTitle ?shortTitle ; + cwork:about ?about ; + cwork:mentions ?mentions ; + cwork:dateCreated ?created ; + cwork:dateModified ?modified ; + cwork:description ?description ; + cwork:primaryFormat ?primaryFormat ; + bbc:primaryContentOf ?webDocument . + ?webDocument bbc:webDocumentType ?webDocType . + ?about rdfs:label ?aboutLabel ; + bbc:shortLabel ?aboutShortLabel ; + bbc:preferredLabel ?aboutPreferredLabel . + ?mentions rdfs:label ?mentionsLabel ; + bbc:shortLabel ?mentionsShortLabel ; + bbc:preferredLabel ?mentionsPreferredLabel . + ?creativeWork cwork:thumbnail ?thumbnail . + ?thumbnail a cwork:Thumbnail ; + cwork:altText ?thumbnailAltText ; + cwork:thumbnailType ?thumbnailType . +} +WHERE { + { + SELECT ?creativeWork + WHERE { + ?creativeWork {{{cwAboutOrMentions}}} {{{cwAboutOrMentionsUri}}} . + ?creativeWork a cwork:CreativeWork ; + cwork:dateModified ?modified . + } + ORDER BY DESC(?modified) + LIMIT 10 + } + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:dateModified ?modified . + OPTIONAL { ?creativeWork cwork:shortTitle ?shortTitle . } + OPTIONAL { ?creativeWork cwork:description ?description . } + OPTIONAL { ?creativeWork cwork:about ?about . + OPTIONAL { ?about rdfs:label ?aboutLabel . } + OPTIONAL { ?about bbc:shortLabel ?aboutShortLabel . } + OPTIONAL { ?about bbc:preferredLabel ?aboutPreferredLabel . } + } + OPTIONAL { + ?creativeWork cwork:mentions ?mentions . + OPTIONAL { ?mentions rdfs:label ?mentionsLabel . } + OPTIONAL { ?mentions bbc:shortLabel ?mentionsShortLabel . } + OPTIONAL { ?mentions bbc:preferredLabel ?mentionsPreferredLabel . } + } + OPTIONAL { ?creativeWork cwork:dateCreated ?created . } + OPTIONAL { ?creativeWork cwork:primaryFormat ?primaryFormat . } + OPTIONAL { ?webDocument bbc:primaryContent ?creativeWork . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork bbc:primaryContentOf ?webDocument . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork cwork:thumbnail ?thumbnail . + OPTIONAL { ?thumbnail cwork:altText ?thumbnailAltText . } + OPTIONAL { ?thumbnail cwork:thumbnailType ?thumbnailType . } + } +} +</code></pre><p>Listing 1. Semantic Publishing Benchmark: Query 1</p> +<p>The benchmark test driver is distributed as a jar file, but can also be built using an ant script. It is distributed with the BBC ontologies and reference datasets, the queries and update workloads discussed earlier and the configuration parameters for running the benchmark and for generating the data. 
It is organised in the following different phases: ontology loading and reference dataset loading, dataset generation and loading, warm up (where a series of aggregation queries are run for a predefined amount of time), benchmark where all queries (aggregation and editorial) are run, conformance checking (that allows one to check whether the employed RDF engine implements OWL reasoning) and finally cleanup that removes all the data from the repository. The benchmark provides a certain degree of freedom where each phase can run independently of the others.</p> +<p>The data generator uses an RDF repository to load ontologies and reference datasets; actually, any system that will be benchmarked should have those ontologies loaded. Any repository that will be used for the data generation should be set up with context indexing, and finally geo-spatial indexing, if available, to serve the spatial queries. The current version of the benchmark has been tested with Virtuoso and OWLIM.</p> +<p>The generator uses configuration files that must be configured appropriately to set the values regarding the dataset size to produce, the number of aggregation and editorial agents, the query time out etc. The distributions used by the data generator could also be edited. The benchmark is very simple to run (once the RDF repository used to store the ontologies and the reference datasets is set up, and the configuration files updated appropriately) using the command: java -jar semantic_publishing_benchmark-*.jar test.properties. The benchmark produces three kinds of files that contain (a) brief information about each executed query, the size of the returned result, and the execution time (semantic_publishing_benchmark_queries_brief.log), (b) the detailed log of each executed query and its result (semantic_publishing_benchmark_queries_detailed.log) (c) the benchmark results (semantic_publishing_benchmark_results.log ).</p> +<p>Below we give an example of a run of the benchmark for OWLIM-SE. The benchmark reports the number of edit operations (inserts, updates, and writes) and queries executed at the Nth second of a benchmark run. It also reports that total number of retrieval queries as well as the average number of queries executed per second.</p> +<pre tabindex="0"><code>Seconds run : 600 + Editorial: + 0 agents + + 0 operations (0 CW Inserts, 0 CW Updates, 0 CW Deletions) + 0.0000 average operations per second + + Aggregation: + 8 agents + + 298 Q1 queries + 267 Q2 queries + 243 Q3 queries + 291 Q4 queries + 320 Q5 queries + 286 Q6 queries + 255 Q7 queries + 274 Q8 queries + 271 Q9 queries + + 2505 total retrieval queries + 4.1750 average queries per second +</code></pre><p>Listing 2. A snippet of semantic_publishing_benchmark_results.log</p> +<p>We run the benchmark under the following configuration: we used 8 aggregation agents for query execution and 4 data generator workers all running in parallel. The warm up period is 120 seconds during which a number of aggregation agents is executed to prepare the tested systems for query execution. Aggregation agents run for a period of 600 seconds, and queries timeout after 90 seconds. We used 10 sets of substitution parameters for each query. For data generation, ontologies and reference datasets are loaded in the OWLIM-SE repository. We used OWLIM-SE, Version 5.4.6287 with Sesame Version 2.6 and Tomcat Version 6. 
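+</p>
+<p>As a side note, the per-query counts and average rates in such a log can be summarised mechanically. The following is a small Python sketch (not part of the SPB distribution; the script name is hypothetical) that reads a semantic_publishing_benchmark_results.log file in the format shown in the listing above:</p>
+<pre tabindex="0"><code># Sketch: summarise an SPB results log in the format shown above.
+# Usage: python summarise_spb_log.py semantic_publishing_benchmark_results.log
+import re, sys
+
+counts = {}                  # per-query counts, e.g. {'Q1': 298, 'Q2': 267, ...}
+avg_qps = None
+with open(sys.argv[1]) as log:
+    for line in log:
+        m = re.match(r"\s*(\d+) (Q\d+) queries", line)
+        if m:
+            counts[m.group(2)] = int(m.group(1))
+        m = re.match(r"\s*([\d.]+) average queries per second", line)
+        if m:
+            avg_qps = float(m.group(1))
+print(counts)
+print("average queries per second:", avg_qps)
+</code></pre><p>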
The results we obtained for the 10M, 100M and 1B triple datasets are given in the table below:</p> +<table> +<thead> +<tr> +<th>#triples</th> +<th>Q1</th> +<th>Q2</th> +<th>Q3</th> +<th>Q4</th> +<th>Q5</th> +<th>Q6</th> +<th>Q7</th> +<th>Q8</th> +<th>Q9</th> +<th>#queries</th> +<th>avg. #q. per sec.</th> +</tr> +</thead> +<tbody> +<tr> +<td>10M</td> +<td>298</td> +<td>267</td> +<td>243</td> +<td>291</td> +<td>320</td> +<td>286</td> +<td>255</td> +<td>274</td> +<td>271</td> +<td>2505</td> +<td>4.1750</td> +</tr> +<tr> +<td>100M</td> +<td>53</td> +<td>62</td> +<td>51</td> +<td>52</td> +<td>44</td> +<td>62</td> +<td>25</td> +<td>55</td> +<td>45</td> +<td>449</td> +<td>0.7483</td> +</tr> +<tr> +<td>1B</td> +<td>34</td> +<td>29</td> +<td>22</td> +<td>24</td> +<td>25</td> +<td>29</td> +<td>0</td> +<td>29</td> +<td>28</td> +<td>220</td> +<td>0.3667</td> +</tr> +</tbody> +</table> + + + + + Choke Point Based Benchmark Design + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + <p>The <em>Linked Data Benchmark Council</em> (LDBC) mission is to design and maintain benchmarks for graph data management systems, to establish and enforce standards in running these benchmarks, and to publish and arbitrate around the official benchmark results. The council and its <a href="https://ldbcouncil.org">https://ldbcouncil.org</a> website just launched, and in its first 1.5 years of existence, most effort at LDBC has gone into investigating the needs of the field through interaction with the LDBC Technical User Community (<a href="https://ldbcouncil.org/event/fifth-tuc-meeting">next TUC meeting</a> will be on October 5 in Athens) and indeed into <em>designing benchmarks</em>.</p> +<p>So, what makes a good benchmark design? Many talented people have paved our way in addressing this question, and for relational database systems specifically the benchmarks produced by <a href="http://www.tpc.org/">TPC</a> have been very helpful in maturing relational database technology and making it successful. Good benchmarks are <em>relevant</em> and <em>representative</em> (address important challenges encountered in practice), <em>understandable</em>, <em>economical</em> (implementable on simple hardware), <em>fair</em> (such as not to favor a particular product or approach), <em>scalable</em>, <em>accepted</em> by the community and <em>public</em> (e.g. all of its software is available in open source). This list stems from Jim Gray&rsquo;s <a href="http://research.microsoft.com/en-us/um/people/gray/BenchmarkHandbook/TOC.htm">Benchmark Handbook</a>. In this blogpost, I will share some thoughts on each of these aspects of good benchmark design.</p> +<p>A very important aspect of benchmark development is making sure that the community <em>accepts</em> a certain benchmark and starts using it. A benchmark without published results, and therefore without the opportunity to compare results, remains irrelevant. A European FP7 project is a good place to start gathering a critical mass of support (and consensus, in the process) for a new benchmark from the core group of benchmark designers in the joint work performed by the consortium. Since in LDBC multiple commercial graph and RDF vendors are on the table (Neo Technologies, Openlink, Ontotext and Sparsity), a minimal consensus on <strong>fairness</strong> had to be established immediately.
The Linked Data Benchmark Council itself is a noncommercial, neutral entity which releases all its benchmark specifications and software, as well as many materials created during the design. LDBC has spent a lot of time engaging interested parties (mainly through its <a href="https://ldbcouncil.org/tags/tuc-meeting/">Technical User Community gatherings</a>) as well as lining up additional organizations as members of the Linked Data Benchmark Council. There is, in other words, a strong non-technical, human factor in getting benchmarks accepted.</p> +<p>The need for <em>understandability</em> for me means that a database benchmark should consist of a limited number of queries and result metrics. Hence I find TPC-H with its 22 queries more understandable than TPC-DS with its 99, because after (quite some) study and experience it is possible to understand the underlying challenges of all queries in TPC-H. It may also be possible for TPC-DS, but the amount of effort is just much larger. Understandable also means for me that a particular query should behave similarly, regardless of the query parameters. Often, a particular query needs to be executed many times, and in order not to play into the hands of simple query caching, and also to enlarge the access footprint of the workload, different query parameters should be used. However, parameters can strongly change the nature of a query, which is not desirable for the understandability of the workload. For instance, we know that TPC-H Q01 tests raw computation power, as its selection predicate eliminates almost nothing from the main fact table (LINEITEM), which it scans and aggregates into a small 4-tuple result. Using a selection parameter that would select only 0.1% of the data instead would seriously change the nature of Q01, e.g. making it amenable to indexing. This stability of parameter bindings is an interesting challenge for the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) of LDBC, which is not as uniform and uncorrelated as TPC-H. Addressing the challenge of obtaining parameter bindings that have similar execution characteristics will be the topic of a future blog post.</p> +<p>The <em>economical</em> aspect of benchmarking means that while high-end benchmark runs are rewarded with higher scores, it is valuable if a meaningful run can also be done with small hardware. For this reason, it is good practice to use a performance-per-EURO (or $) metric, so that small installations, despite a lower absolute score, can still do well on that metric. The economical aspect is right now hurting the (still) leading relational OLTP benchmark TPC-C. Its implementation rules are such that for higher reported rates of throughput, a higher number of warehouses (i.e. larger data size) is needed. In the current day and age of JIT-compiled machine-code SQL procedures and CPU-cache optimized main memory databases, the OLTP throughput numbers now obtainable on modern transactional systems like Hyper on even a single server (it reaches more than 100.000 transactions per second) are so high that they lead to petabyte storage requirements. Not only does this make TPC-C very expensive to run, just by the sheer amount of hardware needed according to the rules, but it also undermines its representativity, since OLTP data sizes encountered in the field are much smaller than OLAP data sizes and do not run in the petabytes.</p> +<p><em>Representative</em> benchmarks can be designed by studying or even directly using real workload information, e.g. 
query logs. A rigorous example of this is the <a href="http://aksw.org/Projects/DBPSB.html">DBpedia benchmark</a> whose workload is based on the query logs of dbpedia.org. However, this SPARQL endpoint is a single public Virtuoso instance that has been configured to interrupt all long running queries, such as to ensure the service remains responsive to as many users as possible. As a result, it is only practical to run small lookup queries on this database service, so the query log only contained solely such light queries. As a consequence, the DBpedia benchmark only tests small SPARQL queries that stress simple B-tree lookups only (and not joins, aggregations, path expressions or inference) and poses almost no technical challenges for either query optimization or execution. The lesson, thus, is to balance representativity with relevance (see later).</p> +<p>The fact that a benchmark can be <em>scaled</em> in size favors the use of synthetic data (i.e. created by a data generator) because data generators can produce any desired quantity of data. I hereby note that in this day and age, data generators should be parallel. Single-threaded single-machine data generation just becomes unbearable even at terabyte scales. A criticism of synthetic data is that it may not be representative of real data, which e.g. tends to contain highly correlated data with skewed distributions. This may be addressed to a certain extent by injecting specific skew and correlations into synthetic data as well (but: which skew and which correlations?). An alternative is to use real data and somehow blow up or contract the data. This is the approach in the mentioned DBpedia benchmark, though such scaling will distort the original distributions and correlations. Scaling a benchmark is very useful to investigate the effect of data size on the metric, on individual queries, or even in micro-benchmark tests that are not part of the official query set. Typically OLTP database benchmarks have queries whose complexity is O(log(N)) of the data size N, whereas OLAP benchmarks have queries which are linear, O(N) or at most O(N.log(N)) &ndash; otherwise executing the benchmark on large instances is infeasible. OLTP queries thus typically touch little data, in the order of log(N) tuples. In order not to measure fully cold query performance, OLTP benchmarks for that reason need a warmup phase with O(N/log(N)) queries in order to get the system into a representative state.</p> +<p>Now, what makes a benchmark <em>relevant</em>? In LDBC we think that benchmarks should be designed such that crucial areas of functionality are highlighted, and in turn system architects are stimulated to innovate. Either to catch up with competitors and bring the performance and functionality in line with the state-of-the-art but even to innovate and address technical challenges for which until now no good solutions exist, but which can give a decisive performance advantage in the benchmark. Inversely stated, benchmark design can thus be a powerful tool to influence the industry, as a benchmark design may set the agendas for multiple commercial design teams and database architects around the globe. To structure this design process, LDBC introduces the notion of <em>&ldquo;choke points&rdquo;</em>: by which we mean problems that challenge current technology. These choke points are collected and described early in the LDBC design process, and the workloads developed later are scored in terms of their coverage of relevant choke points. 
In case of graph data querying, one of the choke points that is unique to the area is recursive Top-N query handling (e.g. shortest path queries). Another choke point that arises is the impact of correlations between attribute value of graph nodes (e.g. both employed by TUM) and the connectivity degree between nodes (the probability to be friends). The notion observed in practice is that people who are direct colleagues, often are in each others friend network. A query that selects people in a social graph that work for the same company, and then does a friendship traversal, may get a bad intermediate result size estimates and therefore suboptimal query plan, if optimizers remain unaware of value/structure correlations. So this is an area of functionality that the Social Network Benchmark (SNB) by LDBC will test.</p> +<p>To illustrate what choke points are in more depth, we wrote a <a href="https://ldbcouncil.org/docs/papers/tpc-h-analyzed-choke-points-tpctc2013.pdf">paper in the TPCTC 2013</a> conference that performs a post-mortem analysis of TPC-H and identified 28 such choke points. <em><a href="chokepoints.png">This table</a></em> lists them all, grouped into six Choke Point (CP) areas (CP1 Agregation, CP2 Join, CP3 Locality, CP4 Calculations, CP5 Subqueries and CP6 Parallelism). The classification also shows CP coverage over each of the 22 TPC-H queries (black is high impact, white is no impact):</p> +<p>I would recommend reading this paper to anyone who is interested in improving the TPC-H score of a relational database system, since this paper contains the collected experience of three database architects who have worked with TPC-H at length: Orri Erling (of Virtuoso), Thomas Neumann (Hyper,RDF-3X), and me (MonetDB,Vectorwise). Recently Orri Erling showed that this paper is not complete as he discovered one more choke-point area for TPC-H: Top-N pushdown. In a detailed blog entry, Orri shows how this technique can <a href="http://www.openlinksw.com/weblog/oerling/?id=1779">trivialize Q18</a>; and this optimization can single handedly improve the overall TPC-score by 10-15%. This is also a lesson for LDBC: even though we design benchmarks with choke points in mind, the queries themselves may bring to light unforeseen opportunities and choke-points that may give rise to yet unknown innovations.</p> +<p>LDBC has just published two benchmarks as Public Drafts, which essentially means that you are cordially invited to download and try out the RDF-focused Semantic Publishing Benchmark <a href="https://ldbcouncil.org/developer/spb">(SPB)</a> and the more graph-focused Social Network Benchmark (<a href="https://ldbcouncil.org/developer/snb">SNB</a>), and <a href="https://groups.google.com/forum/#!forum/ldbcouncil">tell us what you think</a>. 
Stay tuned for the coming detailed blog posts about these benchmarks, which will explain the graph and RDF processing choke-points that they test.</p> +<p><em>(for more posts from Peter Boncz, see also <a href="https://databasearchitects.blogspot.com">Database Architects</a>, a blog about data management challenges and techniques written by people who design and implement database systems)</em></p> + + + + + New Website Online LDBC Benchmarks Reach Public Draft + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + <p>The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23 2014, in announcing that two of the benchmarks that it has been developing since 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In case of LDBC, the release is staged: now the benchmark software just runs read-only queries. This will be expanded in a few weeks with a mix of read- and insert-queries. Also, query validation will be added later. Watch this blog for the announcements to come, as this will be a matter of weeks to add.</p> +<p>The Public Draft stage means that the initial software (data generator, query driver) work and an initial technical specification and documentation has been written. In other words, there is a testable version of the benchmark available for anyone who is interested. Public Draft status does not mean that the benchmark has been adopted yet, it rather means that LDBC has come closer to adopting them, but is now soliciting feedback from the users. The benchmarks will remain in this stage at least until October 6. On that date, LDBC is organizing its fifth <a href="https://ldbcouncil.org/event/fifth-tuc-meeting">Technical User Community meeting</a>. One of the themes for that meeting is collecting user feedback on the Public Drafts; which input will be used to either further evolve the benchmarks, or adopt them.</p> +<p>You can also see that we created a this new website and a new logo. This website is different from <code>http://ldbc.eu</code> that describes the EU project which kick-starts LDBC. The ldbcouncil.org is a website maintained by the Linked Data Benchmark Council legal entity, which will live on after the EU project stops (in less than a year). The Linked Data Benchmark Council is an independent, impartial, member-sustained organization dedicated to the creation of RDF and graph data management benchmarks and benchmark practices.</p> +<p>In the next weeks, you will see many contributors in LDBC post items on this blog. Some of these blog entries will be very technical, others not, but all aim to explain what LDBC is doing for RDF and graph benchmarking, and why.</p> + + + + + Social Network Benchmark Goals + https://ldbcouncil.org/post/social-network-benchmark-goals/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/social-network-benchmark-goals/ + <p>Social Network interaction is amongst the most natural and widely spread activities in the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, Social Networks are well understood from the point of view of the data involved and the interaction required by their actors. 
Thus, the concepts of friends of friends or retweets are well established for the data attributes they represent, and queries such as “find the friend of a specified person who has long worked in a company in a specified country” are natural for the users and easy to understand from a functional point of view.</p> +<p>From a totally different perspective, Social Networks are challenging technologically, being part of the Big Data arena, and require the execution of queries that involve complex relationship search and data traversal computations that turn out to be choke points for the data management solutions in the market.</p> +<p>With the objective of shaping a benchmark whose use case is up to date, well understood by everybody, and which poses significant technological challenges, the LDBC consortium decided to create the Social Network Benchmark, <a href="https://ldbcouncil.org/benchmarks/snb">SNB</a>, which is eventually going to include three workloads: the Interactive, the Business Intelligence and the Analytical. Those workloads are going to share a common synthetic data generation tool that will mimic the data managed by real Social Networks.</p> +<p>The SNB data generator created by LDBC is an evolution of the S3G2 data generator and can be found at the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">LDBC Github repository</a>. The data generator is unique because it generates data that contains realistic distributions and correlations among variables that were not taken into consideration before. It also allows generating large datasets because it uses a Hadoop-based implementation to compute the complex data generated. The SNB data generator has already been used in different situations like the <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD programming contest 2014</a>.</p> +<p>The SNB presents the Interactive workload as the first of the three, with the objective of resembling the queries that users may issue against a Social Network portal. These are a combination of small read and write queries that express the needs of a user who is interacting with her friends and connections through the Social Network. Queries like the one explained above (Q12 in the workload) are examples that exercise choke points like pattern recognition or full traversals.</p> +<p>More details will be given in the blog posts to follow, both for the data generator and for the specific characteristics of the workloads, allowing users to get a first contact with the benchmarks.</p>
A period of more than one and a half years has led us to the creation of the first two workloads, the Semantic Publishing Benchmark and the Social Network Benchmark in its interactive workload, which you will find in the <em>benchmarks</em> menu on this site.</p> +<p>These benchmarks will allow all the actors in the RDF and Graph industry to know who is who and how the different technology players are responding to the results of their competitors. Thus, users will have results with which to compare the technologies, and vendors will have a clear idea of how their products evolve compared to other vendors, all with the objective of fostering the technological growth of the RDF and Graph arena.</p> +<p>While the main objective of LDBC is to create benchmarks, we know that we need a strong community to grow and evolve those benchmarks, taking into consideration all the market and technology needs. With this objective, we have created a special section to engage the interested community through a blog, forums to discuss interesting issues and a lot of information on benchmarking, including links to other benchmarks, pointers to interesting conferences and venues and all the publications on benchmarking RDF and Graph technologies.</p> +<p>We want to make sure that we all know what benchmarking and the LDBC effort mean, both historically and from the perspective of global needs. To make sure that this is accomplished, we set up a section open to the public with in-depth explanations of the history of industry benchmarking, LDBC and why our society needs such efforts globally.</p> +<p>Finally, we want to invite you to our Fifth Technical Users Community (TUC) meeting to be held in Athens next Monday Oct. 6th 2014. This event will have as its main objective to allow for presentations on experiences with the two already released benchmarks, SNB and SPB. You&rsquo;ll find updated information here.</p> +<p>In all, we expect that the LDBC organisation site engages all of you and that the growth of RDF and Graph technologies in the future is secured by the benchmarks fostered by us.</p> + + + + + 2nd International Workshop on Benchmarking RDF Systems + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + <p>Following the 1st International workshop on Benchmarking RDF Systems (BeRSys 2013), the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industry practitioners can meet to discuss topics related to the performance of RDF systems. BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines, in the line of the TPCTC series of workshops. The focus of the workshop is to expose and initiate discussions on best practices, different application needs and scenarios related to different aspects of RDF data management.</p> +<p>More at: <a href="http://events.sti2.at/bersys2014/">http://events.sti2.at/bersys2014/</a></p> + + + + + DATAGEN: Data Generation for the Social Network Benchmark + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + <p>As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective of providing a realistic yet challenging workload, consisting of a social network and a set of queries.
Both have to be realistic, easy to understand and easy to generate. This post has the objective of discussing the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 <a href="#references">[1]</a>.</p> +<p>One of the most important components of a benchmark is the dataset. However, directly using real data in a benchmark is not always possible. On the one hand, it is difficult to find data with all the scaling characteristics the benchmark requires. On the other hand, collecting real data can be expensive or simply not possible due to privacy concerns.</p> +<p>For these reasons, LDBC-SNB provides DATAGEN, the synthetic data generator responsible for generating the datasets for the three LDBC-SNB workloads: the Interactive, the Business Intelligence and the Analytical. DATAGEN has been carefully designed with the following goals in mind:</p> +<ul> +<li><strong>Realism.</strong> The data generated by DATAGEN has to mimic the features of the data found in a real social network. In DATAGEN, output attributes, cardinalities, correlations and distributions have been finely tuned to reproduce a real social network in each of its aspects. DATAGEN is aware of the data and link distributions found in a real social network such as Facebook <a href="#references">[2]</a>. Also, it uses real data from DBpedia, such as property dictionaries, which ensure that the content is realistic and correlated.</li> +<li><strong>Scalability.</strong> Since LDBC-SNB is targeting systems of different scales and budgets, DATAGEN must be capable of generating datasets of different sizes, from a few gigabytes to terabytes. DATAGEN is implemented following the MapReduce paradigm, allowing for the generation of large datasets on commodity clusters.</li> +<li><strong>Determinism.</strong> DATAGEN is deterministic regardless of the number of cores/machines used to produce the data. This important feature guarantees that all Test Sponsors will face the same dataset, thus making the comparisons between different systems fair and the benchmarks&rsquo; results reproducible.</li> +<li><strong>Usability.</strong> LDBC-SNB has been designed to have an affordable entry point. As such, DATAGEN has been strongly influenced by this philosophy, and therefore it has been designed to be as easy to use as possible.</li> +</ul> +<p>Finally, the area of application of DATAGEN is not limited to the scope of LDBC-SNB. Several researchers and practitioners are already using DATAGEN in a wide variety of situations. If you are interested in the internals and possibilities of DATAGEN, please visit its official repository (<a href="https://github.com/ldbc/ldbc_snb_datagen">https://github.com/ldbc/ldbc_snb_datagen</a>).</p> +<h4 id="references">References</h4> +<p>[1] Pham, Minh-Duc, Peter Boncz, and Orri Erling. &ldquo;S3G2: A scalable structure-correlated social graph generator.&rdquo; Selected Topics in Performance Evaluation and Benchmarking. Springer Berlin Heidelberg, 2013. 156-172.</p> +<p>[2] Prat-Pérez, Arnau, and David Dominguez-Sal. &ldquo;How community-like is the structure of synthetically generated graphs?&rdquo; Proceedings of Workshop on GRAph Data management Experiences and Systems.
ACM, 2014.</p> + + + + + Getting Started With SNB + https://ldbcouncil.org/post/getting-started-with-snb/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-snb/ + <p>In a previous blog post titled &ldquo;<a href="https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/">Is SNB like Facebook&rsquo;s LinkBench?</a>&rdquo;, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.</p> +<h3 id="datagen">DATAGEN</h3> +<p>DATAGEN is the data generator used by all the workloads of SNB. <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/">Here</a> we introduced the design goals that drive the development of DATAGEN, which can be summarized as: <em>Realism, Scalability, Determinism and Usability.</em></p> +<p>DATAGEN produces datasets with the following schema, in terms of entities and their relations. The generated data represents a snapshot of the activity of a social network, similar to real social networks such as Facebook, during a period of time. The data includes entities such as Persons, Organizations, and Places. The schema also models the way persons interact, by means of the friendship relations established with other persons, and the sharing of content such as messages (both textual and images), replies to messages and likes of messages. People form groups to talk about specific topics, which are represented as tags.</p> +<p><img src="schema.png" alt="image"></p> +<p>For the sake of credibility, data produced by DATAGEN has to be realistic. In this sense, data produced by DATAGEN not only has a realistic schema, but also pays attention to the following items:</p> +<ul> +<li> +<p>Realistic distributions. The degree distribution of friendship relationships has been modeled to reproduce that found in the Facebook graph. Also, other distributions such as the number of replies to a post, the number of persons per country or the popularity of a tag have been realistically modeled, either using known distributions or data extracted from real sources such as DBpedia.</p> +</li> +<li> +<p>Correlated attributes and relations. Attribute values are not chosen at random, but follow correlations. For instance, people from a specific country have a larger probability of having names typical of that country, of working at companies from that country or of studying at universities of that country. Also, DATAGEN implements a relationship creation process that tries to reproduce the homophily principle, that is, people with similar characteristics tend to be connected.</p> +</li> +</ul> +<p>DATAGEN is built on top of Hadoop to generate datasets of different sizes. It works either on single-node SMP machines or in a cluster environment. DATAGEN supports different output formats targeting different systems. On the one hand, we have the CSV format, where each entity and relation is output into a different comma-separated value file. On the other hand, it also supports the Turtle format for RDF systems.</p> +<p>Finally, DATAGEN outputs two other things:</p> +<ul> +<li> +<p>Update Streams, which will be used in the future to implement updates in the workloads.</p> +</li> +<li> +<p>Substitution parameters, which are the parameters of the query instances the LDBC driver will issue.
These are selected so that the query plans of the resulting query executions do not differ significantly.</p> +</li> +</ul> +<p>Configuring and using DATAGEN is easy. Please visit <a href="https://github.com/ldbc/ldbc_snb_datagen">this page</a> for more information.</p> +<h3 id="ldbc-driver">LDBC driver</h3> +<p>SNB is designed to be as easy to adopt as possible. Therefore, SNB provides the LDBC execution driver, which is designed to automatically generate the benchmark workload and gather the benchmark results. It generates a stream of operations in conformance with a workload definition and executes those operations against some system using the provided database connector, with the substitution parameters produced by DATAGEN. During execution, the driver continuously measures performance metrics, then upon completion it generates a report of those metrics.</p> +<p>It is capable of generating parallel workloads (e.g. concurrent reads and writes), while respecting the configured operation mix and ensuring that ordering between dependent operations is maintained. For further details on how the driver achieves that, please visit the Documentation <a href="https://github.com/ldbc/ldbc_driver/wiki">page</a>.</p> +<p>The test sponsor (i.e. the implementer of the benchmark) has to provide a set of implemented interfaces that form a benchmark implementation to plug into the driver, and then the benchmark is executed automatically.</p> +<p>Given a workload consisting of a series of <em>Operations</em>, the test sponsor implements <em>OperationHandlers</em> for them. <em>OperationHandlers</em> are responsible for executing instances of a specific operation (query) type. This is done by overriding the method <em>executeOperation</em>(), which receives an <em>Operation</em> instance as its input parameter and returns the result. From the <em>Operation</em> instance, the operation&rsquo;s input parameters can be retrieved, as well as the database connection state.</p> +<p>The database connector is used to initialize, clean up and get the database connection state. The database connector must implement the <em>Db</em> interface, which consists of three methods: <em>onInit</em>(), <em>onCleanup</em>() and <em>getConnectionState</em>(). <em>onInit</em>() is called before the benchmark is executed, and is responsible for initializing the database and registering the different <em>OperationHandlers</em>. <em>onCleanup</em>() is called after the benchmark has completed. Any resources that need to be released should be released here.</p> +<p>Finally, <em>getConnectionState</em>() returns an instance of <em>DbConnectionState</em>, which encapsulates any state that needs to be shared between <em>OperationHandler</em> instances. For instance, this state could contain the necessary classes used to execute a given query for the implementing system.</p>
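+<p>To make this structure more concrete, here is a small, self-contained sketch in plain Java of how the pieces fit together. The interfaces are simplified and defined inline, and every class, method and operation name in it (e.g. <em>FriendsWithNameOperation</em>) is made up for illustration; the real driver API differs in details such as generics, handler registration and result reporting, so consult the driver documentation for the actual signatures.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java">// Schematic sketch only: simplified, inline versions of the concepts described above.
+import java.util.HashMap;
+import java.util.Map;
+
+class MyConnectionState {                                 // state shared by all handlers,
+    final Map&lt;String, String&gt; config = new HashMap&lt;&gt;();   // e.g. a client or session object
+}
+
+class FriendsWithNameOperation {                          // one operation (query) type of the workload
+    final long personId;
+    final String firstName;
+    FriendsWithNameOperation(long personId, String firstName) {
+        this.personId = personId;
+        this.firstName = firstName;
+    }
+}
+
+class FriendsWithNameHandler {                            // executes instances of one operation type
+    Object executeOperation(FriendsWithNameOperation op, MyConnectionState state) {
+        // translate the operation into a query for the system under test and run it;
+        // here we only return a placeholder result
+        return "friends of " + op.personId + " named " + op.firstName;
+    }
+}
+
+class MyDb {                                              // database connector: lifecycle hooks of a run
+    private MyConnectionState state;
+    void onInit(Map&lt;String, String&gt; properties) {         // open connections, register handlers here
+        state = new MyConnectionState();
+        state.config.putAll(properties);
+    }
+    void onCleanup() { state = null; }                    // release resources acquired in onInit()
+    MyConnectionState getConnectionState() { return state; }
+}
+
+public class DriverConnectorSketch {
+    public static void main(String[] args) {
+        MyDb db = new MyDb();
+        db.onInit(new HashMap&lt;String, String&gt;());
+        Object result = new FriendsWithNameHandler().executeOperation(
+                new FriendsWithNameOperation(42L, "Anna"), db.getConnectionState());
+        System.out.println(result);
+        db.onCleanup();
+    }
+}
+</code></pre></div><p>With an implementation along these lines plugged in, the driver takes care of the rest: it calls the connector&rsquo;s initialization hook, dispatches the generated operations to the corresponding handlers according to the configured mix, and collects the timing results.</p>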
+<p>A good example on how to implement the benchmark can be found <a href="https://github.com/ldbc/ldbc_driver/wiki/Implementing%20a%20Database%20Connector">here</a>.</p> +<h3 id="workloads">Workloads</h3> +<p>Currently, LDBC has only released the first draft of the Interactive workload, but the business intelligence and analytical workloads are in the works. Workloads are designed to mimic the different usage scenarios found in operating a real social network site, and each of them targets one or more types of systems. Each workload defines a set of queries and query mixes, designed to stress the systems under test in different choke-point areas, while being credible and realistic.</p> +<p>The Interactive workload reproduces the interaction between the users of the social network by including lookups and transactions that update small portions of the database. These queries are designed to be interactive and target systems capable of responding to such queries with low latency for multiple concurrent users. Examples of Interactive queries are, given a user, retrieving those friends with a specific name, or finding the most recent posts and comments created by your friends.</p> +<p>The Business Intelligence workload will represent the business intelligence analytics a social network company would like to perform on the social network, in order to take advantage of the data to discover new business opportunities. This workload will explore moderate portions of data from different entities, and will perform more complex and data-intensive operations compared to the Interactive ones.</p> +<p>Examples of possible Business Intelligence queries could be finding the trending topics in a country at a given moment, or looking for fraudulent “likers”.</p> +<p>Finally, the Analytical workload will aim at exploring the characteristics of the underlying structure of the network. Shortest paths, community detection or centrality are representative queries of this workload, and they imply touching a vast amount of the dataset.</p> +<h3 id="final-remarks">Final remarks</h3> +<p>This is just a quick overview of the SNB benchmark. For a more detailed description, do not hesitate to read the official SNB specification <a href="https://github.com/ldbc/ldbc_snb_docs">draft</a>, and stay tuned to the LDBC blog for future blog posts detailing all of the SNB parts in depth.</p> + + + + + Introducing SNB Interactive, the LDBC Social Network Benchmark Online Workload + https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/ + <p>The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads: interactive, business intelligence and graph analytics. This post introduces the interactive workload.</p> +<p>The benchmark measures the speed of queries of medium complexity against a social network being constantly updated. The queries are scoped to a user&rsquo;s social environment and potentially access data associated with the friends of a user and their friends.</p> +<p>This is representative of an operational application. It goes beyond OLTP (On Line Transaction Processing) by having substantially more complex queries touching much more data than the point lookups and short reports in TPC-C or TPC-E. The emphasis is on presenting a rich and timely view of a constantly changing environment.</p> +<p>SNB Interactive gives end users and application developers a reference workload for comparing the relative merits of different technologies for graph data management. These range from dedicated graph databases to RDF stores and relational databases. There are graph serving benchmarks such as Facebook&rsquo;s LinkBench, but SNB Interactive goes well beyond this in richness of schema and queries.</p> +<p>The challenge to implementors is handling the user-facing logic of a social network in a single system as the scale increases.
The present practice in large social networks is massive sharding and the use of different SQL and key-value stores for different aspects of the service. The SNB workload is not intended to replicate this situation but to look for ways forward, so that one system can keep up with transactions and offer users rich and varied insight into their environment. The present practice relies on massive precomputation, but SNB Interactive seeks more agility and ad hoc capability also on the operational side.</p> +<p>The dataset is scaled in buckets, with distinct scales for 10, 30, 100, 300GB and so forth. A 100GB dataset has approximately 500,000 simulated users with their connections and online history. This is a convenient low-end single-server size, while 500 million users is 100TB, which is a data center scale requiring significant scale-out.</p> +<p>The metric is operations per minute at scale. Online benchmarks typically have a fixed ratio between throughput and dataset size. Here we depart from this; thus one can report arbitrarily high throughputs at any scale. This makes main-memory approaches feasible, which corresponds to present online practices. The benchmark makes transactions and queries on a simulated timeline of social interactions. The challenge for the system is to run this as fast as possible at the selected scale while providing fast and predictable response times. Throughput can be increased at the cost of latency, but here the system must satisfy response time criteria while running at the reported throughput.</p> +<p>Different technologies can be used for implementing SNB Interactive. The workload is defined in natural language with sample implementations in SPARQL and Cypher. Other possibilities include SQL and graph database APIs.</p> +<p>SNB Interactive is an example of LDBC&rsquo;s choke-point-driven design methodology, where we draw on the combined knowledge and experience of several database system architects for defining realistic, yet ambitious challenges whose solution will advance the state of the art.</p> +<p>The benchmark specification and associated tools are now offered for public feedback. The LDBC partners working on SNB Interactive will provide sample implementations of the workload on their systems, including Virtuoso, Neo4j and Sparsity. Specifics of availability and coverage may vary.</p> +<p>Subsequent posts will address the workload in more detail.</p> + + + + + Is SNB Like Facebooks LinkBench + https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/ + <p>In this post, I will discuss in some detail the rationale and goals of the design of the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) and explain how it relates to real social network data as in Facebook, and in particular Facebook&rsquo;s own graph benchmark called <a href="https://www.facebook.com/notes/facebook-engineering/linkbench-a-database-benchmark-for-the-social-graph/10151391496443920">LinkBench</a>. We think SNB is the most intricate graph database benchmark to date (it&rsquo;s also available in RDF!), and it has already made some waves.
SNB recently received praise at the most important database systems conference, <a href="http://www.sigmod2014.org/">SIGMOD in Snowbird</a>, after being used for this year&rsquo;s <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD Programming Contest</a>, which was about graph analytics.</p> +<p>SNB is intended to provide the following <strong>value</strong> to different stakeholders:</p> +<ul> +<li> +<p>For end users facing graph processing tasks, SNB provides a recognizable scenario against which it is possible to <em>compare merits of different products</em> and technologies. By covering a wide variety of scales and price points, SNB can serve as an aid to technology selection.</p> +</li> +<li> +<p>For vendors of graph database technology, SNB provides a <em>checklist of features</em> and performance characteristics that helps in product positioning and can serve to guide new development.</p> +</li> +<li> +<p>For researchers, both industrial and academic, the SNB dataset and workload provide <em>interesting challenges</em> in multiple technical areas, such as query optimization, (distributed) graph analysis and transactional throughput, and provide a way to objectively compare the effectiveness and efficiency of new and existing technology in these areas.</p> +</li> +</ul> +<p>I should clarify that even though the data model of SNB resembles Facebook (and we&rsquo;re extending it to also look more like Twitter), the goal of SNB is not to advise Facebook or Twitter what systems to use; they don&rsquo;t need LDBC for that. Rather, we take social network data as a model for the much broader graph data management problems that IT practitioners face. The particular characteristic of a graph data management problem is that the queries and analysis are not just about finding data by value, but about learning about the <em>connection patterns</em> between data. The scenario of the SNB, a social network, was chosen with the following goals in mind:</p> +<ul> +<li> +<p>the benchmark scenario should be <strong>understandable</strong> to a large audience, and this audience should also understand the relevance of managing such data.</p> +</li> +<li> +<p>the scenario in the benchmark should cover the complete range of challenges <strong>relevant</strong> for graph data management, according to the benchmark scope.</p> +</li> +<li> +<p>the query challenges in it should be <strong>realistic</strong> in the sense that, though synthetic, similar data and workloads are encountered in practice.</p> +</li> +</ul> +<p>The SNB is in fact three distinct benchmarks with a common dataset, since there are <em>three different workloads</em>. Each workload produces a single metric for performance at the given scale and a price/performance metric at the scale. The full disclosure further breaks down the composition of the metric into its constituent parts, e.g. single query execution times.</p> +<ul> +<li> +<p><strong>Interactive Workload.</strong> The Interactive SNB workload is the first one we are releasing. It is defined in plain text, yet we have example implementations in Neo4j&rsquo;s Cypher, SPARQL and SQL. The Interactive workload tests a system&rsquo;s throughput with relatively simple queries and concurrent updates. The system under test (SUT) is expected to run in a steady state, providing durable storage with smooth response times. Inserts are typically small, affecting a few nodes at a time, e.g. uploading of a post and its tags. Transactions may require serializability, e.g.
verifying that something does not exist before committing the transaction. Reads do not typically require more than read committed isolation. One could call the Interactive Workload an OLTP workload, but while queries typically touch a small fraction of the database, this can still be up to hundreds of thousands of values (often the two-step neighborhood of a person in the social graph). Note that in order to support the read queries, there is a lot of liberty to create indexing structures or materialized views; however, such structures need to be maintained with regard to the continuous inserts that are also part of the workload. This workload is now in draft stage, which means that the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a> and <a href="https://github.com/ldbc/ldbc_driver">driver software stack</a> are ready and the purpose is to obtain user feedback, as well as develop good system implementations. The first implementations of this workload are now running on Openlink Virtuoso, Neo4j and Sparsity Sparksee, and we are eager to see people try these, and to optimize and improve them.</p> +</li> +<li> +<p><strong>Business Intelligence Workload.</strong> There is a first stab at this workload formulated in SPARQL, tested against Openlink Virtuoso. The BI workload consists of complex structured queries for analyzing online behavior of users for marketing purposes. The workload stresses query execution and optimization. Queries typically touch a large fraction of the data and do not require repeatable read. The queries will be concurrent with trickle load (not out yet). Unlike the interactive workload, the queries touch more data as the database grows.</p> +</li> +<li> +<p><strong>Graph Analytics Workload.</strong> This workload is not yet available. It will test the functionality and scalability of the SUT for graph analytics that typically cannot be expressed in a query language. As such it is the natural domain for graph programming frameworks like Giraph. The workload is still under development, but will consist of algorithms like PageRank, Clustering and Breadth First Search. The analytics is done on most of the data in the graph as a single operation. The analysis itself produces large intermediate results. The analysis is not expected to be transactional or to have isolation from possible concurrent updates.</p> +</li> +</ul> +<p>All the SNB scenarios share a common scalable synthetic data set, generated by a state-of-the-art <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a>. We strongly believe in a single dataset that makes sense for all workloads; that is, the interactive and BI workloads will traverse data that has sensible PageRank outcomes, graph clustering structure, etc. This is in contrast to <a href="http://people.cs.uchicago.edu/~tga/pubs/sigmod-linkbench-2013.pdf">LinkBench</a>, released by the team at Facebook that manages the OLTP workload on the Facebook Graph, which closely tunes to the <strong>low-level</strong> MySQL query patterns Facebook sees, but whose graph structure does not attempt to be realistic beyond the average out-degree of the nodes (so it makes no attempt to create realistic community patterns or correlations).
The authors of LinkBench may be right that the graph structure does not make a difference for the simple insert/update/delete/lookup actions which LinkBench itself tests, but for the SNB queries in the Interactive and BI workloads this is not true. Note that <a href="http://borthakur.com/ftp/sigmod2013.pdf">Facebook&rsquo;s IT infrastructure</a> does not store all user data in MySQL and its modified memcached (&quot;<a href="http://www.cs.cmu.edu/~pavlo/courses/fall2013/static/papers/11730-atc13-bronson.pdf">TAO</a>&quot;); some of it ends up in separate subsystems (using HDFS and HBase), which is outside of the scope of LinkBench. However, for queries like those in the SNB Interactive and BI workloads it <strong>does</strong> matter how people are connected, and how the attribute values of connected people correlate. In fact, the SNB data generator is unique in that it generates a huge graph with <em>correlations</em>, where people who live together, have the same interests or work for the same company have a greater chance of being connected, and people from Germany have mostly German names, etc. Correlations frequently occur in practice and can strongly influence the quality of query optimization and execution; therefore LDBC wants to test their effects on graph data management systems (the impact of correlation among values and structure on query optimization and execution is a &ldquo;choke point&rdquo; for graph data management systems where LDBC wants to stimulate innovation).</p> + + + + + Making It Interactive + https://ldbcouncil.org/post/making-it-interactive/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-it-interactive/ + <p><em>Synopsis:</em> Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must be both credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation for what online systems in fact do. So, the workload mix must strike a balance between current practice and presenting new challenges.</p> +<p>It is about to be showtime for LDBC. The initial installment of the LDBC Social Network Benchmark (SNB) is the full data generator, test driver, workload and reference implementation for the interactive workload. SNB will further acquire business intelligence and graph analytics workloads, but this post is about the interactive workload.</p> +<p>As part of finalizing the interactive workload, we need to determine precise mixes of the component queries and updates. We note that the interactive mix so far consists of very heavy queries. These touch, depending on the scale, upwards of a million entities in the database.</p> +<p>Now, rendering a page view in a social network site does not touch millions of entities. The query that needs to be correct and up to date touches tens or hundreds of entities, e.g. posts or social connections for a single page impression.
There are also statistical views like the count of people within so many steps or contact recommendations, but these are not real-time and are not recalculated each time they are shown.</p> +<p>So, LDBC SNB has a twofold task:</p> +<ol> +<li>In order to be a credible interactive workload, it must in fact have the characteristics of one.</li> +<li>In order to stimulate progress, it must have queries that are harder than those that go in routine page views but are still not database-wide analytics.</li> +</ol> +<p>Designing a workload presents specific challenges:</p> +<ol> +<li>The workload must be realistic enough for users to identify with it.</li> +<li>The workload must pose challenges and drive innovation in a useful direction.</li> +<li>The component operations must all play a noticeable role in it. If the operation&rsquo;s relative performance does not affect the score, why is it in the workload?</li> +</ol> +<p>The interactive mix now has 14 queries that are interesting from a query optimization and execution viewpoint but touch millions of entities. This is not what drives page impressions in online sites. Many uses of graph databases and RDF are about online sites, so this aspect must not be ignored.</p> +<p>Very roughly, the choke points (technical challenges) of SNB interactive are as follows:</p> +<ul> +<li>Random access - Traversing between people and content makes large numbers of random lookups. These can be variously parallelized and/or vectored.</li> +<li>Query optimization must produce the right plans - The primary point is join order and join type. Index vs. hash-based joins have very different performance properties and the right choice depends on correctly guessing the number of rows and of distinct keys on either side of the join.</li> +<li>When doing updates and lookups, the execution plan is obvious, but there the choke point is the scheduling of large numbers of short operations.</li> +<li>Many queries have aggregation, many have distinct, all have result ordering and a limit on result count. The diverse interactions of these operators produce optimization opportunities.</li> +</ul> +<p>Dreaming up a scenario and workload is not enough for a benchmark. There must also be a strong indication that the job is doable and plausible in the scenario.</p> +<p>In online benchmarks different operations have different frequencies and the operations are repeated large numbers of times. There is a notion of steady state, so that the reported result represents a level of performance a system can sustain indefinitely.</p> +<p>A key part of the workload definition is the workload mix, i.e. the relative frequencies of the operations. This decides in fact what the benchmark measures.</p> +<p>The other aspect is the metric, typically some variation on operations per unit of time.</p> +<p>All these are interrelated. Here we can take clicks per second as a metric, which is easy to understand. We wish to avoid the pitfall of TPC-C, which ties the metric to a data size, so that for a high metric one must have a correspondingly larger database. This rule makes memory-only implementations in practice unworkable, while in reality many online systems in fact run from memory. So, here we scale in buckets, like in TPC-H, but we still have an online workload. The scenario of the benchmark has its own timeline, here called simulation time. A benchmark run produces events in the simulation time but takes place in real time. This defines an acceleration ratio.
For example, we could say that a system does 1000 operations per second at 300G scale, with an acceleration of 7x, i.e. 7 hours&rsquo; worth of simulation time are done in one hour of real time. A metric of this form is directly understandable for sizing a system, as long as the workload mix is realistic. We note that online sites are usually provisioned so that servers do not run anywhere near their peak throughput at a busy time.</p> +<p>So how to define the actual mix? By measuring. But measuring requires a reference implementation that is generally up to date for the database science of the time and where the individual workload pieces are implemented in a reasonable manner, so no bad query plans or bad schema design. For the reference implementation, we use the Virtuoso column store in SQL.</p> +<p>But SQL is not graphy! Why not SPARQL? Because SPARQL has diverse fixed overheads and this is not an RDF-only workload. We do not want SPARQL overheads to bias the metric; we just want an implementation where we know exactly what goes on and how it works, with control of physical data placement, so we know there are no obvious stupidities in any of this. SPARQL will come. Anyway, as said elsewhere, we believe that SPARQL will outgrow its overheads, at which point SQL or SPARQL is a matter of esthetic preference. For now, it is SQL and all we want is transparency into the metal.</p> +<p>Having this, we peg the operation mix to the update stream generated by the data generator. At the 30G scale, there are 3.5M new posts/replies per month of simulation time. For each of these, a query mix will be run, so as to establish a realistic read/write ratio. The query mix will have fractional queries, for example 0.2 friend recommendations per new post, but that is not a problem, since we run large numbers of these and at the end of the run can check that the ratios of counts are as expected. Next, we run this as fast as it will go on the test system. Then we adjust the ratio of short and long queries to meet the following objectives:</p> +<ul> +<li>Short queries should collectively be about 45% of the CPU load.</li> +<li>Updates will be under 5%.</li> +<li>Long queries will take up the rest. For long queries, we further tune the relative frequencies so that each represents a roughly equal slice of the time. Having a query that does not influence the metric is useless, so each gets enough showtime to have an impact, but by their nature some are longer than others.</li> +</ul> +<p>The reason why short queries should have a large slice is the fact that this is so in real interactive systems. The reason why long queries are important is driving innovation. Like this we get both scheduling (short lookup/update) and optimization choke points covered. As a bonus, we make the mix so that we get a high metric, so many clicks per second, since this is what the operator of an online site wants.</p> +<p>There is a further catch: different scales have different degrees of the friends graph and this will have a different influence on different queries. To see whether this twists the metric out of shape we must experiment. For example, one must not have logarithmic and linear complexity queries in the same mix, as BSBM for example has.
So this is to be kept in mind as we proceed.</p> +<p>In the next post we will look at the actual mix and execution times on the test system.</p> + + + + + SNB Data Generator - Getting Started + https://ldbcouncil.org/post/snb-data-generator-getting-started/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-data-generator-getting-started/ + <p>In previous posts (<a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">this</a> and <a href="https://ldbcouncil.org/post/getting-started-with-snb">this</a>) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datasets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.</p> +<h3 id="getting-and-configuring-hadoop">Getting and Configuring Hadoop</h3> +<p>DATAGEN runs on top of Hadoop 1.2.1 in order to scale. You can download it from here. Open a console and type the following commands to decompress Hadoop into the /home/user folder:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user +</span></span><span style="display:flex;"><span>$ tar xvfz hadoop-1.2.1.tar.gz +</span></span></code></pre></div><p>For simplicity, in this tutorial we will run DATAGEN in standalone mode, that is, only one machine will be used, using only one thread at a time to run the mappers and reducers. This is the default configuration, so nothing else needs to be done to configure it. For other configurations, such as Pseudo-Distributed (multiple threads on a single node) or Distributed (a cluster of machines), visit the <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/wiki/Configuration">LDBC DATAGEN wiki</a>.</p> +<h3 id="getting-and-configuring-datagen">Getting and configuring DATAGEN</h3> +<p>Before downloading DATAGEN, be sure to fulfill the following requirements:</p> +<ul> +<li>Linux-based machine</li> +<li>Java 1.6 or greater</li> +<li>Python 2.7.x</li> +<li>Maven 3</li> +</ul> +<p>After configuring Hadoop, it is time to get DATAGEN from the LDBC-SNB official repositories. Always download the latest release, which at this time is v0.1.2. The releases page can be found <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/releases">here</a>. Again, decompress the downloaded file with the following commands:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user +</span></span><span style="display:flex;"><span>$ tar xvfz ldbc_snb_datagen-0.1.2.tar.gz +</span></span></code></pre></div><p>This will create a folder called “ldbc_snb_datagen-0.1.2”.</p> +<p>DATAGEN provides <em>run.sh</em>, a script to automate the compilation and execution of DATAGEN.
It needs to be configured for your environment, so open it and set the two variables at the top of the script to the corresponding paths.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>HADOOP_HOME<span style="color:#f92672">=</span>/home/user/hadoop-1.2.1 +</span></span><span style="display:flex;"><span>LDBC_SNB_DATAGEN_HOME<span style="color:#f92672">=</span>/home/user/ldbc_snb_datagen +</span></span></code></pre></div><p>HADOOP_HOME points to the path where hadoop-1.2.1 is installed, while LDBC_SNB_DATAGEN_HOME points to where DATAGEN is installed. Change these variables to the appropriate values. Now we can execute the <em>run.sh</em> script to compile and execute DATAGEN using default parameters. Type the following commands:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user/ldbc_snb_datagen-0.1.2 +</span></span><span style="display:flex;"><span>$ ./run.sh +</span></span></code></pre></div><p>This will run DATAGEN, and two folders will be created in the same directory: <em>social_network</em>, containing the scale factor 1 dataset as uncompressed CSV files, and <em>substitution_parameters</em>, containing the substitution parameters needed by the driver to execute the benchmark.</p> +<h3 id="changing-the-generated-dataset">Changing the generated dataset</h3> +<p>The characteristics of the dataset to be generated are specified in the <em>params.ini</em> file. By default, this file has the following content:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:1</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:1</span> +</span></span></code></pre></div><p>The following is the list of options and their default values supported by DATAGEN:</p> +<table> +<thead> +<tr> +<th>Option</th> +<th>Default value</th> +<th>Description</th> +</tr> +</thead> +<tbody> +<tr> +<td>scaleFactor</td> +<td>1</td> +<td>The scale factor of the data to generate. Possible values are: 1, 3, 10, 30, 100, 300 and 1000</td> +</tr> +<tr> +<td>serializer</td> +<td>csv</td> +<td>The format of the output data. Options are: csv, csv_merge_foreign, ttl</td> +</tr> +<tr> +<td>compressed</td> +<td>FALSE</td> +<td>Specifies whether to compress the output data with gzip.</td> +</tr> +<tr> +<td>outputDir</td> +<td>./</td> +<td>Specifies the folder to output the data.</td> +</tr> +<tr> +<td>updateStreams</td> +<td>FALSE</td> +<td>Specifies whether to generate the update streams of the network. If set to false, the update portion of the network is output as static</td> +</tr> +<tr> +<td>numThreads</td> +<td>1</td> +<td>Sets the number of threads to use.
Only works for pseudo-distributed mode</td> +</tr> +</tbody> +</table> +<p>For instance, a possible <em>params.ini</em> file could be the following:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:30</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:ttl</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:true</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span> +</span></span></code></pre></div><p>For those not interested in generating a dataset for a given predefined scale factor, but in other configurations, the following parameters can be specified (they need to be specified all together):</p> +<table> +<thead> +<tr> +<th>Option</th> +<th>Default value</th> +<th>Description</th> +</tr> +</thead> +<tbody> +<tr> +<td>numPersons</td> +<td>-</td> +<td>The number of persons to generate</td> +</tr> +<tr> +<td>numYears</td> +<td>-</td> +<td>The number of years of activity</td> +</tr> +<tr> +<td>startYear</td> +<td>-</td> +<td>The start year of the simulation.</td> +</tr> +</tbody> +</table> +<p>The following is an example of another possible <em>params.ini</em> file:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">numPersons:100000</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numYears:3</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">startYear:2010</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv_merge_foreign</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:true</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span> +</span></span></code></pre></div><p>For more information about the schema of the generated data, the different scale factors and serializers, please visit the wiki page of DATAGEN at <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/">GitHub</a>!</p> + + + + + The Day of Graph Analytics + https://ldbcouncil.org/post/the-day-of-graph-analytics/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/the-day-of-graph-analytics/ + <p><em>Note: consider this post as a continuation of the &ldquo;<a href="https://ldbcouncil.org/post/making-it-interactive">Making it interactive</a>&rdquo; post by Orri Erling.</em></p> +<p>I have now completed the <a href="https://github.com/openlink/virtuoso-opensource">Virtuoso</a> TPC-H work, including scale-out. Optimization possibilities extend to infinity, but the present level is good enough.
<a href="http://www.tpc.org/tpch/">TPC-H</a> is the classic of all analytics benchmarks and is difficult enough; I have extensive commentary on this on my blog (the In Hoc Signo Vinces series), including experimental results. This is, as it were, the cornerstone of the true science. This is however not the totality of it. From the LDBC angle, we might liken this to the last camp before attempting a mountain peak.</p> +<p>So, we may now seriously turn to graph analytics. The project has enough left to run in order to get a good BI and graph analytics workload. In LDBC in general, as in the following, BI or business intelligence means complex analytical queries. Graph analytics means graph algorithms that are typically done in graph programming frameworks or libraries.</p> +<p>The BI part is like TPC-H, except for adding the following challenges:</p> +<ul> +<li> +<p>Joins of derived tables with group by, e.g. comparing the popularity of items in consecutive time periods.</p> +</li> +<li> +<p>Transitive dimensions - A geographical or tag hierarchy can be seen as a dimension table. To get the star schema plan with the selective hash join, the count of the transitive traversal of the hierarchy (hash build side) must be correctly guessed.</p> +</li> +<li> +<p>Transitivity in the fact table, i.e. the average length of a reply thread. There the cost model must figure that the reply link is of much too high cardinality for the hash build side; besides, a transitive operation is not a good candidate for a build in multiple passes, hence the plan will have to be by index.</p> +</li> +<li> +<p>Graph traversal with a condition on the end point and the navigation step. The hierarchical dimensions and reply threads are in fact trees; the social graph is not. Again the system must know some properties of connectedness (in/out degree, count of vertices) to guess a traversal fanout. This dictates the join type in the step (hash or index). An example is a transitive closure with steps satisfying a condition, e.g. all connected persons have a specific clearance.</p> +</li> +<li> +<p>Running one query with parameters from different buckets, implying a different best plan.</p> +</li> +<li> +<p>Data correlations, e.g. high selectivity arising from two interests seldom occurring together, in places where the correct estimation makes the difference between a good and a bad plan.</p> +</li> +<li> +<p>Large intermediate results stored in tables, as in materializing complex summaries of data for use in follow-up queries.</p> +</li> +<li> +<p>More unions and outer joins.</p> +</li> +</ul> +<p>The idea is to cover the base competences the world has come to expect and to build in challenges to last another 10-15 years.</p> +<p>For rules and metric, we can use the TPC-H or <a href="http://www.tpc.org/tpcds/default.asp">TPC-DS</a> ones as a template. The schema may differ from an implementation of the interactive workload, as these things would normally run on different systems anyway. As another activity that is not directly LDBC, I will do a merge of SNB and <a href="http://www.openstreetmap.org/">OpenStreetMap</a>. The geolocated things (persons, posts) will get real coordinates from their vicinity and diverse geo analytics will become possible. This is of some significant interest to GeoKnow, another FP7 project in which OpenLink is participating.</p> +<p>Doing the BI mix and even optimizing the interactive part involves some redoing of the present support for transitivity in Virtuoso.
The partitioned group by with some custom aggregates is the right tool for the job, with all parallelization, scale-out, etc. ready. You see, TPC-H is very useful also in places one does not immediately associate with it.</p> +<p>As a matter of fact, this becomes a BSP (bulk synchronous parallel) control structure. Run any number of steps; in each, every item produces results/effects scattered across partitions. The output of the previous step is the input of the next. We might say BSP is an attractor or &ldquo;Platonic&rdquo; control structure to which certain paths inevitably lead. Last year I did a BSP implementation in SQL, reading and writing tables and using transactions for serializable update of the border. This is possible, but it will not compete with a memory-based framework, and not enough of the optimization potential, e.g. message combining, is visible to the engine in this formulation. So, now we will get this right, as suggested.</p> +<p>So, the transitive derived table construct can have pluggable aggregations (e.g. remembering a path, a minimum length or such), reductions like a scalar-valued aggregate (min/max), different grouping sets like in a group by with cube or grouping sets, some group-by-like reduction for message combining and so forth. If there is a gather phase that is not just the result of the scatter of the previous step, this can be expressed as an arbitrary database query, also cross-partition in a scale-out setting.</p> +<p>The distributed/partitioned group by hash table will be a first-class citizen, like a procedure-scoped temporary table, to facilitate returning multiple results and passing large data between multiple steps with different vertex operations, e.g. forward and backward in betweenness centrality.</p> +<p>This brings us to the graph analytics proper, which is often done in BSP style, e.g. <a href="http://es.slideshare.net/shatteredNirvana/pregel-a-system-for-largescale-graph-processing">Pregel</a>, <a href="http://giraph.apache.org">Giraph</a>, <a href="http://uzh.github.io/signal-collect/">Signal-Collect</a>, and some but not all <a href="http://ppl.stanford.edu/main/green_marl.html">Green-Marl</a> applications. In fact, a Green-Marl back end for Virtuoso is conceivable; whether one will be made is a different matter.</p>
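+<p>As a rough illustration of this control structure, the following self-contained sketch runs a BSP-style breadth-first search in memory: in each superstep, the frontier vertices scatter to their neighbours, and the messages produced by one step become the input of the next, until no messages remain. This is only a single-machine toy for explanation, not the partitioned, in-database formulation discussed above; the graph, identifiers and method names are made up for the example.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java">// Toy BSP control structure: a superstep loop driven by a frontier of "messages".
+import java.util.HashMap;
+import java.util.HashSet;
+import java.util.List;
+import java.util.Map;
+import java.util.Set;
+
+public class BspBfsSketch {
+    // Returns the number of hops from the source to every reachable vertex.
+    static Map&lt;Long, Integer&gt; levels(Map&lt;Long, List&lt;Long&gt;&gt; adjacency, long source) {
+        Map&lt;Long, Integer&gt; level = new HashMap&lt;&gt;();    // settled vertices and their distance
+        Set&lt;Long&gt; frontier = new HashSet&lt;&gt;();          // messages for the current superstep
+        frontier.add(source);
+        int step = 0;
+        while (!frontier.isEmpty()) {                   // one loop iteration = one superstep
+            Set&lt;Long&gt; next = new HashSet&lt;&gt;();           // messages for the next superstep
+            for (long vertex : frontier) {
+                if (level.containsKey(vertex)) continue;    // already settled in an earlier step
+                level.put(vertex, step);
+                for (long neighbour : adjacency.getOrDefault(vertex, List.of())) {
+                    if (!level.containsKey(neighbour)) next.add(neighbour);  // combine duplicate messages
+                }
+            }
+            frontier = next;                            // barrier: swap message sets
+            step++;
+        }
+        return level;
+    }
+
+    public static void main(String[] args) {
+        Map&lt;Long, List&lt;Long&gt;&gt; graph = Map.of(
+                1L, List.of(2L, 3L),
+                2L, List.of(4L),
+                3L, List.of(4L),
+                4L, List.of());
+        System.out.println(levels(graph, 1L));          // prints levels such as {1=0, 2=1, 3=1, 4=2}
+    }
+}
+</code></pre></div><p>In the in-database version sketched in the text, the frontier and per-vertex state would live in the partitioned group by hash table, and the scatter of each step would be an ordinary (cross-partition) query, which is intended to make message combining and parallelization visible to the engine.</p>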
The interested may pitch in as the matter comes up.</p> + + + + + Using LDBC SPB to Find OWLIM Performance Issues + https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/ + Wed, 20 Aug 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/ + <p>During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (LDBC-SPB) as a part of our development and release process.</p> +<p>The first thing we’ve started using the LDBC-SPB for is to monitor the performance of our RDF Store when a new release is about to come out.</p> +<p>Initially we’ve decided to fix some of the benchmark parameters:</p> +<ul> +<li>the dataset size - 50 million triples (LDBC-SPB50)</li> +<li>benchmark warmup and benchmark run times - 60s and 600s respectively</li> +<li>maximum number of Editorial Agents (E): 2 (threads that will execute INSERT/UPDATE operations)</li> +<li>maximum number of Aggregation Agents (A): 16 (threads that will execute SELECT operations)</li> +<li>generated data by the benchmark driver to be “freshly” deployed before each benchmark run - the benchmark driver can be configured to generate the data and stop. We’re using that option and have a fresh copy of it put aside ready for each run.</li> +</ul> +<p>Having those parameters fixed, running LDBC-SPB is a straightforward task. The hardware we’re using for benchmarking is a machine with 2 Intel Xeon CPUs, 8 cores each, 256 GB of memory and SSD storage, running Linux. Another piece of hardware we’ve tested with is a regular desktop machine with an Intel i7, 32 GB of memory and HDD storage. During our experiments we have allowed a deviation in results of 5% to 10% because of the multi-threaded nature of the benchmark driver.</p> +<p>We’ve also decided to produce some benchmark results on Amazon’s EC2 Instances and compare with the results we’ve had so far. Starting with an m3.2xlarge instance (8 vCPUs, 30GB of memory and 2x80GB SSD storage) on a 50M dataset we’ve achieved more than 50% lower results than the ones on our own hardware. On a larger Amazon instance, c3.4xlarge (16 vCPUs, 30GB of memory and doubled SSD storage), we’ve achieved the same performance in terms of aggregation operations and even worse performance in terms of editorial operations, which we attribute to the fact that Amazon instances are not providing consistent performance all the time.</p> +<p>The following two charts show how OWLIM performs on different hardware and with different configurations. They also give an indication of Amazon’s capabilities compared to the results achieved on bare-metal hardware.</p> +<p><img src="16-2-Performance.png" alt="image"></p> +<p>Figure 1: OWLIM Performance: 2 Amazon instances and 2 local machines. 16 aggregation and 2 editorial agents running simultaneously. Aggregation and editorial operations displayed here should be considered independently, i.e. even though the editorial operations graph shows higher results on the Amazon m3.2xlarge instance, values are normalized and refer to the corresponding type of operation.</p> +<p><img src="8-0-Performance.png" alt="image"></p> +<p>Figure 2: OWLIM Performance: 2 Amazon instances and 2 local machines. 8 aggregation agents running simultaneously. Read-only mode.</p> +<p>Another thing that we’re using LDBC-SPB for is to monitor load performance speeds.
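</p>
+<p>Outside of the official driver, a quick way to obtain such a load figure is to time the POSTing of the generator&rsquo;s output chunks to the store&rsquo;s SPARQL endpoint, as the next paragraph describes. The sketch below is only an illustration: the endpoint URL, the file pattern and the Turtle content type are assumptions made for the example and will differ per RDF store and per generator configuration.</p>
+<pre><code class="language-python">import glob, time, urllib.request
+
+ENDPOINT = "http://localhost:8080/repositories/spb/rdf-graphs/service"  # hypothetical endpoint
+CHUNKS = sorted(glob.glob("generated-data/*.ttl"))   # chunks written by the data generator
+
+total_bytes, started = 0, time.time()
+for path in CHUNKS:
+    with open(path, "rb") as f:
+        payload = f.read()
+    req = urllib.request.Request(ENDPOINT, data=payload, method="POST",
+                                 headers={"Content-Type": "text/turtle"})
+    with urllib.request.urlopen(req) as resp:
+        resp.read()                                   # drain the response
+    total_bytes += len(payload)
+
+elapsed = time.time() - started
+print(f"loaded {total_bytes / 1e6:.1f} MB in {elapsed:.1f} s "
+      f"({total_bytes / 1e6 / elapsed:.2f} MB/s)")
+</code></pre>
+<p>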
Loading of generated data can be done either manually, by creating some sort of a script (CURL), or by the benchmark driver itself, which will execute a standard POST request against a provided SPARQL endpoint. The benchmark&rsquo;s data generator can be configured to produce chunks of generated data in various sizes, which can be used for experiments on load performance. Of course, load times of forward-chaining reasoners cannot be compared to those of backward-chaining ones, which is not the goal of the benchmark anyway. Loading performance is not measured “officially” by LDBC-SPB (although the time for loading the data is reported), but it is a good thing to have when comparing RDF stores.</p> +<p>An additional and interesting feature of the SPB is the test for conformance to the OWL2-RL rule-set. It is a part of the LDBC-SPB benchmark and that phase is called <em>checkConformance</em>. The phase is run independently of the benchmark phase itself. It requires no data generation or loading except the initial set of ontologies. It tests the RDF store’s conformance to the rules in the OWL2-RL rule-set by executing a number of INSERT/ASK queries specific to each rule. The result of that phase is a list of all rules that have been passed or failed, which is very useful for regression testing.</p> + + + + + Fourth TUC meeting + https://ldbcouncil.org/event/fourth-tuc-meeting/ + Thu, 03 Apr 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fourth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the fourth Technical User Community (TUC) meeting.</p> +<p>This will be a one-day event at CWI in Amsterdam on <em>Thursday April 3, 2014</em>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend.
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<p><strong>For presenters please limit your talks to just 15 minutes</strong></p> +<h3 id="agenda">Agenda</h3> +<p><strong>April 3rd</strong></p> +<ul> +<li> +<p>10:00 Peter Boncz (VUA) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506371.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=JYWVgrP1kVY">video</a>: <em>LDBC project status update</em></p> +</li> +<li> +<p>10:20 Norbert Martinez (UPC) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506375.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=4yREJQ3yDr0">video</a>: <em>Status update on the LDBC Social Network Benchmark (SNB) task force</em>.</p> +</li> +<li> +<p>10:50 Alexandru Iosup (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506363.ppt">ppt</a>, <a href="https://www.youtube.com/watch?v=ulT-RFwKpOE">video</a>: <em>Towards Benchmarking Graph-Processing Platforms</em></p> +</li> +<li> +<p>11:10 Mike Bryant (Kings College) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506364.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=KiHRTu9xx0A">video</a>: <em>EHRI Project: Archival Integration with Neo4j</em></p> +</li> +</ul> +<p><strong>11:30 coffee</strong></p> +<ul> +<li> +<p>11:50 Thilo Muth (University of Magdeburg) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506369.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=5xH3UDLP6Oc">video</a>: <em>MetaProteomeAnalyzer: a graph database backed software for functional and taxonomic protein data analysis</em></p> +</li> +<li> +<p>12:10 Davy Suvee (Janssen Pharmaceutica / Johnson &amp; Johnson) – <a href="https://www.youtube.com/watch?v=XN3LRJUfJIU">video</a>: <em>Euretos Brain - Experiences on using a graph database to analyse data stored as a scientific knowledge graph</em></p> +</li> +<li> +<p>12:30 Yongming Luo (TU Eindhoven) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506366.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=g_my3tBB2_s">video</a>: <em>Regularities and dynamics in bisimulation reductions of big graphs</em></p> +</li> +<li> +<p>12:50 Christopher Davis (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506370.pdf">pdf</a>, <a href="https://www.youtube.com/channel/UC6HbzfJ4016Vez-2HKNeDag">video</a>: <em>Enipedia - Enipedia is an active exploration into the applications of wikis and the semantic web for energy and industry issues</em></p> +</li> +</ul> +<p><strong>13:10 - 14:30 lunch @ restaurant Polder</strong></p> +<ul> +<li> +<p>14:30 <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506365.pptx">SPB task force report</a></p> +</li> +<li> +<p>15:00 Bastiaan Bijl (Sysunite) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506373.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=TsCeKDHShMY">video</a>: <em>Using a semantic approach for monitoring applications in large engineering projects</em></p> +</li> +<li> +<p>15:20 Frans Knibbe (Geodan) – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506372.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=uAX-m4OewPM">video</a>: <em>Benchmarks for geographical data</em></p> +</li> +<li> +<p>15:40 Armando Stellato (University of Rome, Tor Vergata &amp; UN Food and Agriculture Organization) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506374.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=mfA4csAs72Y">video</a>: <em>VocBench2.0, a Collaborative Environment for SKOS/SKOS-XL Management: scalability and (inter)operatibility challenges</em></p> +</li> +</ul> +<p><strong>16:00 coffee</strong></p> +<ul> +<li> +<p>16:20 Ralph Hodgson (TopQuadrant) – [pdf](https://pu b-3834 10a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachment s/5538064/5506367.pdf), <a href="https://www.youtube.com/watch?v=ZUDnVw9P_Rc">video</a>:<em>Customer experiences in implementing SKOS-based vocabularymanagement systems</em></p> +</li> +<li> +<p>16:40 Simon Jupp (European Bioinformatics Institute) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506368.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=CgTuOGK92W8">video</a>: <em>[Delivering RDF for the life science at the European Bioinformatics Institute: Six months in.]</em></p> +</li> +<li> +<p>17:00 Jerven Bolleman (Swiss Institute of Bioinformatics) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506381.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=QTc3yOgoEsg">video</a>: <em>Breakmarking UniProt RDF. SPARQL queries that make your database cry&hellip;</em></p> +</li> +<li> +<p>17:20 Rein van &rsquo;t Veer (Digital Heritage Netherlands) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506380.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=2vDrZoskGyQ">video</a> <em>Time and space for heritage</em></p> +</li> +<li> +<p>17:40 <strong>end of meeting</strong></p> +</li> +<li> +<p>19:00 - 21:30 Social Dinner in restaurant Boom</p> +</li> +</ul> +<p><strong>April 4th</strong></p> +<p>LDBC plenary meeting for project partners.</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506362.ppt">Benchmarking Graph-Processing Platforms: A Vision</a> – Alexandru Iosup</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p>The meeting will be held at the Dutch national research institute for computer science and mathematics (<a href="http://www.cwi.nl">CWI</a> - Centrum voor Wiskunde en Informatica). 
It is located at <a href="http://www.amsterdamsciencepark.nl/">Amsterdam Science Park</a>:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505821.jpg" alt=""></p> +<p>(<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505820.pdf">A5 map</a>)</p> +<h6 id="travel">Travel</h6> +<p><strong>Arriving &amp; departing:</strong></p> +<p>Amsterdam has a well-functioning and nearby airport called Schiphol (AMS, <a href="http://www.schiphol.com/">www.schiphol.nl</a>) that serves all main European carriers and also very many low-fare carriers.</p> +<p><a href="http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane">http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane</a></p> +<p><strong>Trains</strong> (~5 per hour) are the most convenient means of transport between Schiphol airport and Amsterdam city center, the Centraal Station (17 minutes, a train every 15 minutes) &ndash; which station you are also likely arriving at in case of an international train trip.</p> +<p>From the Centraal Station in Amsterdam, there is a direct train (every half an hour, runs 11 minutes) to the Science Park station, which is walking distance of CWI. If you go from the Centraal Station to one of the hotels, you should take tram 9 &ndash; it starts at Centraal Station (exception: for Hotel Casa 400, you should take the metro to Amstel station - any of the metros will do).</p> +<p><strong>Taxi</strong> is an alternative, though expensive. The price from Schiphol will be around 45 EUR to the CWI or another point in the city center (depending on traffic, the ride is 20-30 minutes).</p> +<p><strong>Public transportation</strong> (tram, bus, metro) tickets for a single ride and 1-day (24 hour) passes can be purchased from the driver/conductor on trams and buses (cash only) and from vending machines in the metro stations.</p> +<p><strong>Only the &ldquo;disposable&rdquo; cards are interesting for you as visitor.</strong></p> +<p>Multi-day (up to 7-days/168 hours) passes can only be purchased from the vending machines or from the ticket office opposite of Centraal Station.</p> +<p><strong>Getting Around:</strong> the fastest way to move in the city of Amsterdam generally is by bicycle. Consider renting such a device at your hotel. For getting from your hotel to the CWI, you can either take a taxi (expensive), have a long walk (35min), use public transportation (for NH Tropen/The Manor take bus 40 from Muiderpoort Station, for Hotel Casa 400 same bus 40 but from Amstel station, and for the Rembrandt Hotel it is tram 9 until Middenweg/Kruislaan and then bus 40), or indeed bike for 12 minutes.</p> +<p><strong>Cars</strong></p> +<p>In case you plan to arrive by car, please be aware that parking space in Amsterdam is scarce and hence very expensive. But, you can park your car on the &ldquo;WCW&rdquo; terrain where CWI is located. To enter the terrain by car, you have to get a ticket from the machine at the gate. To leave the terrain, again, you can get an exit ticket from the CWI reception.</p> +<p><strong>Arriving at CWI:</strong> Once you arrive at CWI, you need to meet the reception, and tell them that you are attending the LDBC TUC meeting. 
Then, you&rsquo;ll receive a visitor&rsquo;s pass that allows you to enter our building.</p> +<p><strong>Social Dinner</strong></p> +<p>The social dinner will take place at 7pm on April 3 in Restaurant Boom (<a href="http://www.boometenendrinken.nl/">boometenendrinken.nl</a>), Linneausstraat 63, Amsterdam.</p> + + + + + Third TUC Meeting + https://ldbcouncil.org/event/third-tuc-meeting/ + Tue, 19 Nov 2013 08:00:00 +0000 + + https://ldbcouncil.org/event/third-tuc-meeting/ + <p>The LDBC consortium is pleased to announce the third Technical User Community (TUC) meeting!</p> +<p>This will be a one day event in London on the <strong>19 November 2013</strong> running in collaboration with the <a href="http://www.graphconnect.com/london/">GraphConnect</a> event (18/19 November). Registered TUC participants that would like a free pass to all of GraphConnect should register for GraphConnect using this following coupon code: <strong>LDBCTUC</strong>.</p> +<p>The TUC event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology</li> +<li>Industry discussions on the contents of the benchmarks</li> +</ul> +<p>We will also be launching the LDBC non-profit organization, so anyone outside the EU project will be able to join as a member.</p> +<p>We will kick off new benchmark development task forces in the coming year, and talks at this coming TUC will play an important role in deciding the use case scenarios that will drive those benchmarks.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a></li> +<li><a href="#ldbctuc-background">LDBC/TUC Background</a> +<ul> +<li><a href="#social-network-benchmark">Social Network Benchmark</a></li> +<li><a href="#semantic-publishing-benchmark">Semantic Publishing Benchmark</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>November 19th - Public TUC Meeting</strong></p> +<p>8:00 Breakfast and registration will open for Graph Connect/TUC at 8:00 am (Dexter House)</p> +<p>short LDBC presentation (Peter Boncz) during GraphConnect keynote by Emil Eifrem (09:00-09:30 Dexter House)</p> +<p>NOTE: the TUC meeting is at the Tower Hotel, nearby Dexter House.</p> +<p>10:00 TUC Meeting Opening (Peter Boncz)</p> +<p>10:10 TUC Presentations (RDF Application Descriptions)</p> +<ul> +<li>Johan Hjerling (BBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275669.pdf">BBC Linked Data and the Semantic Publishing Benchmark</a></strong></em></li> +<li>Andreas Both (Unister): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505027.pdf">Ontology-driven applications in an e-commerce context</a></strong></em></li> +<li>Nuno Carvalho (Fujitsu Laboratories Europe): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275666.pdf"><em><strong>Fujitsu RDF use cases and benchmarking requirements</strong></em></a></li> +<li>Robina Clayphan (Europeana): <em><strong><a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816977.ppt">Europeana and Open Data</a></strong></em></li> +</ul> +<p>11:30 Semantic Publishing Benchmark (SPB)</p> +<ul> +<li>Venelin Kotsev (Ontotext - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">Semantic Publishing Benchmark Task Force Update</a></strong></em> and <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">report</a></strong></em></li> +</ul> +<p>12:00-13:00 Lunch at the Graph Connect venue</p> +<p><em>Talks During Lunch:</em></p> +<ul> +<li>Pedro Furtado, Jorge Bernardino (Univ. Coimbra): <strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275671.pdf">KEYSTONE Cost Action</a></strong></li> +</ul> +<p>13:00 TUC Presentations (Graph Application Descriptions)</p> +<ul> +<li>Minqi Zhou / Weining Qian (East China Normal University): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275670.pdf">Elastic and realistic social media data generation</a></strong></em></li> +<li>Andrew Sherlock (Shapespace): <em><strong>Shapespace Use Case</strong></em></li> +<li>Sebastian Verheughe (Telenor): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275667.pdf">Real-time Resource Authorization</a></strong></em></li> +</ul> +<p>14:00 Social Network Benchmark (SNB)</p> +<ul> +<li>Norbert Martinez (UPC - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505025.pdf">Social Network Benchmark Task Force Update</a></strong></em> and <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816975.pdf">Report</a></li> +</ul> +<p><em>14:30 Break</em></p> +<p>14:45 TUC Presentations (Graph Analytics)</p> +<ul> +<li>Keith Houck (IBM): <em><strong>Benchmarking experiences with [System G Native Store (tentative title)]</strong></em></li> +<li>Abraham Bernstein (University of Zurich): <em><strong>Streams and Advanced Processing: Benchmarking RDF querying beyond the Standard SPARQL Triple Store</strong></em></li> +<li>Luis Ceze (University of Washington): <em><strong>Grappa and GraphBench Status Update</strong></em></li> +</ul> +<p><em>15:45 Break</em></p> +<p>16:00 TUC Presentations* (Possible Future RDF Benchmarking Topics)*</p> +<ul> +<li>Christian-Emil Ore (Unit for Digital Documentation, University of Oslo, Norway): <em><strong>CIDOC-CRM</strong></em></li> +<li>Atanas Kiryakov (Ontotext): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275672.pdf">Large-scale Reasoning with a Complex Cultural Heritage Ontology (CIDOC CRM)</a></strong></em></li> +<li>Kostis Kyzirakos (National and Kapodistrian University of Athens / CWI): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275668.pdf">Geographica: A Benchmark for Geospatial RDF Stores</a></strong></em></li> +<li>Xavier Lopez (Oracle): <em><strong>W3C Property Graph progress</strong></em></li> +<li>Thomas Scharrenbach (University Zurich) <em><strong>PCKS: Benchmarking Semantic Flow Processing Systems</strong></em></li> +</ul> +<p>17:20 
Meeting Conclusion (Josep Larriba Pey)</p> +<p>17:30 End of TUC meeting</p> +<p>19:00 Social dinner</p> +<p><strong>November 20th - Internal LDBC Meeting</strong></p> +<p>10:00 Start</p> +<p>12:30 <em>End of meeting</em></p> +<ul> +<li>coffee and lunch provided</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p><strong>Date</strong></p> +<p>19th November 2013</p> +<p><strong>Location</strong></p> +<p>The TUC meeting will be held in <strong>The Tower</strong> hotel (<a href="http://goo.gl/qZt8Fz">Google Maps link</a>) approximately 4 minutes walk from the <a href="http://www.graphconnect.com/london/">GraphConnect</a> conference in London.</p> +<p>Getting there</p> +<ul> +<li>From City Airport is the easiest: short ride on the DLR to Tower Gateway. Easy.</li> +<li>From London Heathrow: first need to take the Heathrow Express to Paddington. Then take the Circle line to Tower Hill. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554995.pdf">See attached</a>.</li> +</ul> +<h3 id="ldbctuc-background">LDBC/TUC Background</h3> +<p>Looking back, we have been working on two benchmarks for the past year: a Social Network Benchmark (SNB) and a Semantic Publishing Benchmark (SPB). While below we provide a short summary, all the details of the work on these benchmark development efforts can be found in the first yearly progress reports:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SNB_Report_Nov2013.pdf</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SPB_Report_Nov2013.pdf</a></li> +</ul> +<p>A summary of these efforts can be read below or, for a more detailed account, please refer to: <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554967.pdf">The Linked Data Benchmark Council: a Graph and RDF industry benchmarking effort</a>. Annual reports about the progress, results, and future work of these two efforts will soon be available for download here, and will be discussed in depth at the TUC.</p> +<h4 id="social-network-benchmark">Social Network Benchmark</h4> +<p>The Social Network Benchmark (SNB) is designed for evaluating a broad range of technologies for tackling graph data management workloads. The systems targeted are quite broad: from graph, RDF, and relational database systems to Pregel-like graph compute frameworks. The social network scenario was chosen with the following goals in mind:</p> +<ul> +<li>it should be understandable, and the relevance of managing such data should be understandable</li> +<li>it should cover the complete range of interesting challenges, according to the benchmark scope</li> +<li>the queries should be realistic, i.e., similar data and workloads are encountered in practice</li> +</ul> +<p>SNB includes a data generator for creation of synthetic social network data with the following characteristics:</p> +<ul> +<li>data schema is representative of real social networks</li> +<li>data generated includes properties occurring in real data, e.g. 
irregular structure, structure/value correlations, power-law distributions</li> +<li>the software generator is easy-to-use, configurable and scalable</li> +</ul> +<p>SNB is intended to cover a broad range of aspects of social network data management, and therefore includes three distinct workloads:</p> +<ul> +<li><strong>Interactive</strong> +<ul> +<li>Tests system throughput with relatively simple queries and concurrent updates; it is designed to test ACID features and scalability in an online operational setting.</li> +<li>The targeted systems are expected to be those that offer transactional functionality.</li> +</ul> +</li> +<li><strong>Business Intelligence</strong> +<ul> +<li>Consists of complex structured queries for analyzing the online behavior of users for marketing purposes; it is designed to stress query execution and optimization.</li> +<li>The targeted systems are expected to be those that offer an abstract query language.</li> +</ul> +</li> +<li><strong>Graph Analytics</strong> +<ul> +<li>Tests the functionality and scalability of systems for graph analytics, which typically cannot be expressed in a query language.</li> +<li>Analytics is performed on most/all of the data in the graph as a single operation and produces large intermediate results, and it is not expected to be transactional or need isolation.</li> +<li>The targeted systems are graph compute frameworks, though database systems may compete, for example by using iterative implementations that repeatedly execute queries and keep intermediate results in temporary data structures.</li> +</ul> +</li> +</ul> +<h4 id="semantic-publishing-benchmark">Semantic Publishing Benchmark</h4> +<p>The Semantic Publishing Benchmark (SPB) simulates the management and consumption of RDF metadata that describes media assets, or creative works.</p> +<p>The scenario is a media organization that maintains RDF descriptions of its catalogue of creative works &ndash; input was provided by actual media organizations which make heavy use of RDF, including the BBC. The benchmark is designed to reflect a scenario where a large number of aggregation agents provide the heavy query workload, while at the same time a steady stream of creative work description management operations is in progress. This benchmark only targets RDF databases, which support at least basic forms of semantic inference. A tagging ontology is used to connect individual creative work descriptions to instances from reference datasets, e.g. sports, geographical, or political information. The data used will fall under the following categories: reference data, which is a combination of several Linked Open Data datasets, e.g. GeoNames and DBpedia; domain ontologies, which are specialist ontologies used to describe certain areas of expertise of the publisher, e.g., sport and education; publication asset ontologies, which describe the structure and form of the assets that are published, e.g., news stories, photos, video, audio, etc.; and tagging ontologies and the metadata, which link assets with reference/domain ontologies.</p> +<p>The data generator is initialized by using several ontologies and datasets. The instance data collected from these datasets are then used at several points during the execution of the benchmark.
Data generation is performed by generating SPARQL fragments for create operations on creative works and executing them against the RDF database system.</p> +<p>Two separate workloads are modeled in SPB:</p> +<ul> +<li><strong>Editorial:</strong> Simulates creating, updating and deleting creative work metadata descriptions. Media companies use both manual and semi-automated processes for efficiently and correctly managing asset descriptions, as well as annotating them with relevant instances from reference ontologies.</li> +<li><strong>Aggregation:</strong> Simulates the dynamic aggregation of content for consumption by the distribution pipelines (e.g. a web-site). The publishing activity is described as &ldquo;dynamic&rdquo;, because the content is not manually selected and arranged on, say, a web page. Instead, templates for pages are defined and the content is selected when a consumer accesses the page.</li> +</ul> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505026.pdf">Status of the Semantic Publishing Benchmark</a></p> + + + + + Second TUC Meeting + https://ldbcouncil.org/event/second-tuc-meeting/ + Mon, 22 Apr 2013 10:00:00 +0000 + + https://ldbcouncil.org/event/second-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the second Technical User Community (TUC) meeting.</p> +<p>This will be a two day event in Munich on the <strong>22/23rd April 2013</strong>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend. 
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +<li><a href="#venue">Venue</a> +<ul> +<li><a href="#getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</a></li> +<li><a href="#getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</a></li> +<li><a href="#getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</a></li> +</ul> +</li> +<li><a href="#getting-there">Getting there</a></li> +<li><a href="#social-dinner">Social Dinner</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>April 22nd</strong></p> +<p>10:00 <em>Registration.</em><br> +10:30 Josep Lluis Larriba Pey (UPC) - <em>Welcome and Introduction.</em><br> +10:30 Peter Boncz (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687373.pptx">LDBC: goals and status</a></p> +<p><em>Social Network Use Cases (with discussion moderated by Josep Lluis Larriba Pey)</em></p> +<p>11:00 Josep Lluis Larriba Pey (UPC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687372.pdf">Social Network Benchmark Task Force</a><br> +11:30 Gustavo González (Mediapro): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687367.pdf">Graph-based User Modeling through Real-time Social Streams</a><br> +12:00 Klaus Großmann (Dshini): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687365.pdf">Neo4j at Dshini</a></p> +<p>12:30 Lunch</p> +<p><em>Semantic Publishing Use Cases (with discussion moderated by Barry Bishop)</em></p> +<p>13:30 Barry Bishop (Ontotext): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687366.pptx">Semantic Publishing Benchmark Task Force</a><br> +14:00 Dave Rogers (BBC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687364.pptx">Linked Data Platform at the BBC</a><br> +14:30 Edward Thomas (Wolters Kluwer): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687374.pdf">Semantic Publishing at Wolters Kluwer</a></p> +<p>15:00 Coffee break</p> +<p><em>Projects Related to LDBC</em></p> +<p>15:30 Fabian Suchanek (MPI): &ldquo;YAGO: A large knowledge base from Wikipedia and WordNet&rdquo;<br> +16:00 Antonis Loziou (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687375.pptx">The OpenPHACTS approach to data integration</a><br> +16:30 Mirko Kämpf (Brox): &ldquo;GeoKnow - Spatial Data Web project and Supply Chain Use Case&rdquo;</p> +<p>17:00 <em>End of first day</em></p> +<p>19:00 Social dinner</p> +<p><strong>April 23rd</strong></p> +<p><em>Industry &amp; Hardware Aspects</em></p> +<p>10:00 Xavier Lopez (Oracle): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687384.pdf">Graph Database Performance an Oracle Perspective.pdf</a><br> +10:30 Pedro Trancoso (University of Cyprus): &ldquo;Benchmarking and computer architecture: the research 
side&rdquo;</p> +<p>11:00 Coffee break</p> +<p><em>Future Steps and TUC feedback session</em></p> +<p>11:30 Peter Boncz (VUA) moderates: next steps in the Social Networking Task Force<br> +12:00 Barry Bishop (Ontotext) moderates: next steps in the Semantic Publishing Task Force&quot;</p> +<p>12:30 <em>End of meeting</em></p> +<h3 id="logistics">Logistics</h3> +<h4 id="date">Date</h4> +<p>22nd and 23th April 2013</p> +<h4 id="location">Location</h4> +<p>The TUC meeting will be held at LE009 room at LRZ (Leibniz-Rechenzentrum) located inside the TU Munich campus in Garching, Germany. The address is:</p> +<p>LRZ (Leibniz-Rechenzentrum)<br> +Boltzmannstraße 1<br> +85748 Garching, Germany</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including Taxi and Subway <a href="http://www.in.tum.de/fileadmin/user_upload/Sonstiges/anfahrt_garching.pdf">Ubahn</a></p> +<h5 id="getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</h5> +<p>Take the U-bahn line U6 in the direction of Garching-Forschungszentrum, exit at the end station. Take the south exit to MI-Building and LRZ on the Garching Campus. The time of the journey from the city center is approx. 25-30 minutes. In order to get here from the City Center, you need the Munich XXL ticket that costs around 7.50 euros and covers all types of transportation for one day. The ticket has to be validated before ride.</p> +<h5 id="getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</h5> +<ol> +<li> +<p>(except weekends) S-Bahn S8 line in the direction of (Hauptbahnhof) Munich Central Station until the third stop, Ismaning (approx. 13 minutes). From here Bus Nr. 230 until stop MI-Building on the Garching Campus. Alternatively: S1 line until Neufahrn, then with the Bus 690, which stops at Boltzmannstraße.</p> +</li> +<li> +<p>S-Bahn lines S8 or S1 towards City Center until Marienplatz stop. Then change to U-bahn U6 line towards Garching-Forschungszentrum, exit at the last station. Take the south exit to MI-Building and LRZ.</p> +</li> +<li> +<p>Taxi: fare is ca. 30-40 euros.</p> +</li> +</ol> +<p>For cases 1 and 2, before the trip get the One-day Munich Airport ticket and validate it. It will cover all public transportation for that day.</p> +<h5 id="getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</h5> +<p>The city of Garching is located on the U6 line, one stop before the Garching-Forschungszentrum. In order to get from Garching to Garching-Forschungszentrum with the U-bahn, a special one-way ticket called Kurzstrecke (1.30 euros) can be purchased.</p> +<p><strong>Finding LRZ@TUM</strong></p> +<p><a href="http://www.openstreetmap.org/?mlat=48.2615702464&amp;mlon=11.6686558264&amp;zoom=32">OpenStreetMap link</a></p> +<p><a href="https://maps.google.com/maps?q=48.2615702464,11.6686558264&amp;spn=0.005,0.005&amp;t=k">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687268.gif" alt=""></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687269.gif" alt=""></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying: Munich</strong> airport is located 28.5 km northeast of Munich. 
There are two ways to get from the airport to the city center: suburban train (S-bahn) and Taxi.</p> +<p><strong>S-Bahn:</strong> S-bahn lines S1 and S8 will get you from the Munich airport to the city center, stopping at both Munich Central Station (Hauptbahnhof) and Marienplatz. A one-day Airport-City ticket costs 11.20 euros and is valid for the entire Munich area public transportation during the day of purchase (the ticket needs to be validated before the journey). The S-bahn leaves every 5-20 minutes and reaches the city center in approx. 40 minutes.</p> +<p><strong>Taxi:</strong> a taxi from the airport to the city center costs approximately 50 euros</p> +<h4 id="social-dinner">Social Dinner</h4> +<p>The social dinner will take place at 7 pm on April 22 in Hofbräuhaus (second floor)</p> +<p>Address: Hofbräuhaus, Platzl 9, Munich</p> + + + + + First TUC Meeting + https://ldbcouncil.org/event/first-tuc-meeting/ + Mon, 19 Nov 2012 09:00:00 +0100 + + https://ldbcouncil.org/event/first-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the first Technical User Community (TUC) meeting. This will be a two-day event in Barcelona on the <strong>19/20th November 2012</strong>.</p> +<p>So far more than six commercial consumers of graph/RDF database technology have expressed an interest in attending the event and more are welcome. The proposed format of the event will include:</p> +<ul> +<li>Introduction by the coordinator and technical director explaining the objectives of the LDBC project</li> +<li>Invitation to users to explain their use-cases and describe the limitations they have found in current technology</li> +<li>Brain-storming session for identifying trends and mapping out strategies to tackle existing choke-points</li> +</ul> +<p>The exact agenda will be published here as things get finalised before the event.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#slide">Slide</a> +<ul> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +</ul> +</li> +<li><a href="#venue">Venue</a></li> +<li><a href="#getting-there">Getting there</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p>We will start at 9:00 on Monday for a full day, followed by half a day on Tuesday to allow attendees to travel home on the evening of the 20th.</p> +<p><strong>Day 1</strong></p> +<p>09:00 Welcome (Location: Aula Master)<br> +09:30 Project overview (Emphasis on task forces?)
+ Questionnaire results?<br> +10:30 Coffee break<br> +11:00 User talks (To gather information for use cases?)</p> +<p>13:00 Lunch</p> +<p>14:00 User talks (cont.)<br> +15:00 Use case discussions (based on questionnaire results + consortium proposal + user talks).<br> +16:00 Task force proposals (consortium)<br> +17:00 Finish first day</p> +<p>20:00 Social dinner</p> +<p><strong>Day 2</strong></p> +<p>10:00 Task force discussion (consortium + TUC)<br> +11:00 Coffe break<br> +11:30 Task force discussion (consortium + TUC)<br> +12:30 Summaries (Task forces, use cases, &hellip;) and actions</p> +<p>13:00 Lunch and farewell</p> +<p>15:00 LDBC Internal meeting</p> +<h3 id="slide">Slide</h3> +<p>Opening session:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686995.pptx">CWI – Peter Boncz</a> – Objectives</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687001.pdf">UPC – Larri</a> – Questionnaire</li> +</ul> +<p>User stories:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686998.pdf">BBC – Jem Rayfield</a></li> +<li>CA Technologies – Victor Muntés</li> +<li>Connected Discovery (Open Phacts) – Bryn Williams-Jones</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687003.pptx">Elsevier – Alan Yagoda</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687000.pptx">ERA7 Bioinformatics – Eduardo Pareja</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687005.pptx">Press Association – Jarred McGinnis</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687004.pptx">RJLee – David Neuer</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686994.pdf">Yale – Lec Maj</a></li> +</ul> +<p>Benchmark proposals:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686991.pdf">Publishing benchmark proposal – Ontotext – Barry Bishop</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687002.pdf">Social Network Benchmark Proposal – UPC – Larri</a></li> +</ul> +<h4 id="logistics">Logistics</h4> +<h5 id="date">Date</h5> +<p>19th and 20th November 2012</p> +<h5 id="location">Location</h5> +<p>The TUC meeting will be held at “Aula Master” at A3 building located inside the “Campus Nord de la UPC” in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<p><strong>Finding UPC</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<p><strong>Finding the meeting room</strong></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €16 and trips to other destinations in the city cost approximately €18.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<p><strong>The locations of the airport and the city centre</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933317.jpg" alt=""></p> +<p><strong>Bus map</strong></p> + + + + + \ No newline at end of file diff --git a/benchmarks/overview/index.html b/benchmarks/overview/index.html new file mode 100644 index 00000000..a43ae549 --- /dev/null +++ b/benchmarks/overview/index.html @@ -0,0 +1,356 @@ + + + + + Overview of LDBC Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Overview of LDBC Benchmarks

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

LDBC currently offers the following benchmarks:

+ +

Uses of LDBC benchmarks are subject to the Fair Use Policy for LDBC Benchmarks.

+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/page/1/index.html b/benchmarks/page/1/index.html new file mode 100644 index 00000000..7060f873 --- /dev/null +++ b/benchmarks/page/1/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/benchmarks/ + + + + + + diff --git a/benchmarks/page/2/index.html b/benchmarks/page/2/index.html new file mode 100644 index 00000000..b1b496f0 --- /dev/null +++ b/benchmarks/page/2/index.html @@ -0,0 +1,804 @@ + + + + + Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Benchmarks

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+ +
+ +

We are delighted to announce the setting up of the Financial Benchmark (FinBench) task force.

+

The Financial Benchmark (FinBench) project aims to define a graph database evaluation benchmark and to develop a data generation process and a query driver to make the evaluation of graph databases representative, reliable and comparable, especially in financial scenarios, such as anti-fraud and risk control. The FinBench is scheduled to be released in the …

+ +
+
+ +
+ + +
+
+
+ +

Speeding Up LDBC SNB Datagen

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

LDBC’s Social Network Benchmark [4] (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework where different graph-based technologies can be fairly tested and compared, that can drive the identification of systems’ bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data …

+ +
+
+ +
+ + + + + +
+
+
+ +

LDBC and Apache Flink

+
Tags:
+ FLINK + , DATAGEN + , SNB + +
+
+ +

Apache Flink [1] is an open source platform for distributed stream and batch data processing. Flink’s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.

+

+

Flink offers multiple APIs to process data …

+ +
+
+ +
+ + +
+
+
+ +

Elements of Instance Matching Benchmarks: a Short Overview

+
Tags:
+ INSTANCE MATCHING + , SPB + +
+
+ +

The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not …

+ +
+
+ +
+ + +
+
+ +
+ +

In this post we will look at running the LDBC SNB on Virtuoso.

+

First, let’s recap what the benchmark is about:

+
    +
  1. +

    fairly frequent short updates, with no update contention worth mentioning

    +
  2. +
  3. +

    short random lookups

    +
  4. +
  5. +

    medium complex queries centered around a person’s social environment

    +
  6. +
+

The updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/page/3/index.html b/benchmarks/page/3/index.html new file mode 100644 index 00000000..4441eea2 --- /dev/null +++ b/benchmarks/page/3/index.html @@ -0,0 +1,796 @@ + + + + + Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Benchmarks

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

SNB and Graphs Related Presentations at GRADES '15

+
Tags:
+ SIGMOD + , GRAPHALYTICS + , GRADES + , SNB + , DATAGEN + , WORKSHOP + +
+
+ +

On the 31st of May, the GRADES workshop will take place in Melbourne as part of the ACM SIGMOD/PODS conference. GRADES started as an initiative of the Linked Data Benchmark Council at SIGMOD/PODS 2013, held in New York.

+

Among the papers published in this edition we have “Graphalytics: A Big Data Benchmark for Graph-Processing Platforms”, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can …

+ +
+
+ +
+ + +
+
+
+ +

SNB Interactive Part 2: Modeling Choices

+
Tags:
+ SNB + , VIRTUOSO + , INTERACTIVE + +
+
+ +

​SNB Interactive is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.

+

In the case of Virtuoso, we have played with SQL and SPARQL implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that …

+ +
+
+ +
+ + +
+
+
+ +

LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference

+
Tags:
+ SIGMOD + , GRADES + , SNB + , GRAPHALYTICS + , WORKSHOP + +
+
+ +

LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015. The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.

+

On the industry track, LDBC will be presenting the Social Network Benchmark Interactive …

+ +
+
+ +
+ + +
+
+
+ +

SNB Interactive Part 1: What Is SNB Interactive Really About?

+
Tags:
+ SNB + , VIRTUOSO + , INTERACTIVE + +
+
+ +

This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. This is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of same.

+

With two implementations of SNB interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its …

+ +
+
+ +
+ + +
+
+
+ +

Why Do We Need an LDBC SNB-Specific Workload Driver?

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

In a previous 3-part blog series we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn’t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more …

+ +
+
+ +
+ + +
+
+
+ +

Event Driven Post Generation in Datagen

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain more in depth how this is actually implemented inside of the generator.

+

First of all, I start with a few basics of how Datagen works internally. In Datagen, once the person graph has been created (persons and their relationships), …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/page/4/index.html b/benchmarks/page/4/index.html new file mode 100644 index 00000000..05144fba --- /dev/null +++ b/benchmarks/page/4/index.html @@ -0,0 +1,768 @@ + + + + + Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Benchmarks

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

The LDBC Datagen Community Structure

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.

+

When generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other more qualitative characteristics such as the degree distribution, clustering coefficient. Real graphs, and …

+ +
+
+ +
+ + +
+
+
+ +

Industry Relevance of the Semantic Publishing Benchmark

+
Tags:
+ INDUSTRY + , SPB + +
+
+ + + post/industry-relevance-of-the-semantic-publishing-benchmark/01_sf_newspapers.png +
+ +
+ +

Publishing and media businesses are going through transformation

+

I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and …

+ +
+
+ +
+ + +
+
+
+ +

OWL-Empowered SPARQL Query Optimization

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution …

+ +
+
+ +
+ + +
+
+
+ +

Person Activity Subgraph Features in LDBC DATAGEN

+
Tags:
+ SNB + , DATAGEN + +
+
+ +

When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically drawn to the friendship subgraph and/or its structure. However, a social graph is more than a bunch of people connected by friendship relations; it has a lot of other things that are worth looking at. With a quick look at commercial social networks like Facebook, Twitter or Google+, one can easily identify a lot of other …

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 2: Tracking Dependencies Between Queries

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

The SNB Driver part 1 post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we’ll drill down deeper into the details of what it means to execute “dependent queries” during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in …
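As a rough illustration of what tracking dependencies between queries involves, here is a simplified Python sketch of a completion-time gate: a dependent operation may only be issued once the operations it depends on have completed. This is only a sketch of the idea under simplified assumptions, not the driver's actual implementation.

```python
import heapq

# Simplified sketch of the idea, not the actual driver code: every operation
# has a scheduled start time, and a dependent operation may only be issued
# once the "completion time" (the point up to which all earlier operations
# have finished) has advanced past its dependency time.
class CompletionTimeTracker:
    def __init__(self):
        self._in_flight = []          # min-heap of start times of running ops
        self.completion_time = 0.0    # everything before this time is done

    def initiate(self, start_time):
        heapq.heappush(self._in_flight, start_time)

    def complete(self):
        # For this sketch, assume operations complete in start-time order.
        finished = heapq.heappop(self._in_flight)
        self.completion_time = max(self.completion_time, finished)

    def can_execute(self, dependency_time):
        return dependency_time is None or dependency_time <= self.completion_time

tracker = CompletionTimeTracker()
tracker.initiate(1.0)            # e.g. an "add post" update starts at t=1
print(tracker.can_execute(1.0))  # False: the operation it depends on is still running
tracker.complete()
print(tracker.can_execute(1.0))  # True: safe to issue the dependent operation
```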

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 3: Workload Execution Putting It All Together

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

Up until now we have introduced the challenges faced when executing the LDBC SNB benchmark, as well as explained how some of these are overcome. With the foundations laid, we can now explain precisely how operations are executed.

+

Based on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these …
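For illustration only, the sketch below shows what assigning such modes per operation type could look like in Python; the mode and operation names are simplified placeholders and do not reproduce the driver's actual terminology or API.

```python
from enum import Enum

# Illustrative placeholders only -- these names do not reproduce the driver's
# actual terminology; they merely show the shape of a per-operation-type
# assignment of a dependency mode and an execution mode.
class DependencyMode(Enum):
    NONE = "depends on nothing"
    READ_AFTER_WRITE = "must wait for earlier writes to complete"

class ExecutionMode(Enum):
    ASYNCHRONOUS = "issue as soon as the schedule and dependencies allow"
    WINDOWED = "issue within bounded time windows, window by window"

OPERATION_MODES = {
    "ComplexReadQuery": (DependencyMode.NONE, ExecutionMode.ASYNCHRONOUS),
    "AddFriendshipUpdate": (DependencyMode.READ_AFTER_WRITE, ExecutionMode.WINDOWED),
}

for op, (dep, exe) in OPERATION_MODES.items():
    print(f"{op}: dependency mode = {dep.name}, execution mode = {exe.name}")
```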

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/page/5/index.html b/benchmarks/page/5/index.html new file mode 100644 index 00000000..9298d051 --- /dev/null +++ b/benchmarks/page/5/index.html @@ -0,0 +1,768 @@ + + + + + Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Benchmarks

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide

+
Tags:
+ SPB + , SESAME + , RDF + , TUTORIAL + , GUIDE + +
+
+ +

Until now we have discussed several aspects of the Semantic Publishing Benchmark (SPB) such as the difference in performance between virtual and real servers configuration, how to choose an appropriate query mix for a benchmark run and our experience with using SPB in the development process of GraphDB for finding performance issues.

+

In this post we provide a step-by-step guide on how to run SPB using the Sesame RDF data store on a fresh install …

+ +
+
+ +
+ + +
+
+
+ +

Semantic Publishing Instance Matching Benchmark

+
Tags:
+ INSTANCE MATCHING + , BENCHMARK + +
+
+ +

The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the-art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.

+

The SPIMBench …

+ +
+
+ +
+ + +
+
+
+ +

Further Developments in SNB BI Workload

+
Tags:
+ SNB + , BI + +
+
+ +

We are presently working on the SNB BI workload. Andrey Gubichev of TU München and I are going through the queries and are playing with two SQL-based implementations, one on Virtuoso and the other on Hyper.

+

As discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.

+

There are obvious marketing applications for an SNB-like dataset. There are also security …

+ +
+
+ +
+ + +
+
+
+ +

Sizing AWS Instances for the Semantic Publishing Benchmark

+
Tags:
+ SPB + , AMAZON + , EC2 + , AWS + , RDF + +
+
+ +

LDBC’s Semantic Publishing Benchmark (SPB) measures the performance of an RDF database under a load typical for metadata-based content publishing, such as the famous BBC Dynamic Semantic Publishing scenario. Such a load combines tens of updates per second (e.g. adding metadata about new articles) with an even higher volume of read requests (SPARQL queries collecting recent content and data to generate a web page on a specific subject, e.g. Frank …

+ +
+
+ +
+ + +
+
+
+ +

DATAGEN: a Realistic Social Network Data Generator

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

In previous posts (Getting started with snb, DATAGEN: data generation for the Social Network Benchmark), Arnau Prat discussed the main features and characteristics of DATAGEN: realism, scalability, determinism, usability. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity in a social network site during a period of time. In this post, we conduct a series of experiments …

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 1

+
Tags:
+ SNB + , DRIVER + , TPC-C + , INTERACTIVE + +
+
+ +

In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as driver). Software and documentation for this driver is available here: …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/page/6/index.html b/benchmarks/page/6/index.html new file mode 100644 index 00000000..6f1a9f0c --- /dev/null +++ b/benchmarks/page/6/index.html @@ -0,0 +1,776 @@ + + + + + Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Benchmarks

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Making Semantic Publishing Execution Rules

+
Tags:
+ SPB + , TEST RUN + +
+
+ +

LDBC SPB (Semantic Publishing Benchmark) is based on the BBC linked data platform use case. Thus the data modelling and transaction mix reflect the BBC’s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an Ontotext GraphDB deployment. GraphDB was formerly known as OWLIM.

+

So, in SPB we wanted to address substantially more complex queries than the lookups that …

+ +
+
+ +
+ + +
+
+ +
+ +

The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies …

+ +
+
+ +
+ + +
+
+
+ +

Choke Point Based Benchmark Design

+
Tags:
+ DATABASE + , BENCHMARK + , DESIGN + +
+
+ +

The Linked Data Benchmark Council's (LDBC) mission is to design and maintain benchmarks for graph data management systems, to establish and enforce standards for running these benchmarks, and to publish and arbitrate the official benchmark results. The council and its https://ldbcouncil.org website just launched, and in its first 1.5 years of existence, most effort at LDBC has gone into investigating the needs of the field through interaction …

+ +
+
+ +
+ + +
+
+
+ +

New Website Online LDBC Benchmarks Reach Public Draft

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23 2014, in announcing that two of the benchmarks that it has been developing for 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In the case of LDBC, the release is staged: for now, the benchmark software runs read-only queries only. This will be …

+ +
+
+ +
+ + +
+
+
+ +

Social Network Benchmark Goals

+
Tags:
+ SNB + , DATAGEN + , INTERACTIVE + , BI + , GRAPHALYTICS + +
+
+ +

Social network interaction is among the most natural and widespread activities of the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, social networks are well understood from the point of view of the data involved and the interaction required by their actors. Thus, concepts such as friends-of-friends or retweets are well established …

+ +
+
+ +
+ + +
+
+ +
+ +

It is with great pleasure that we announce the new LDBC organisation site at www.ldbcouncil.org. LDBC started as a European Community FP7-funded project with the objective to create, foster and become an industry reference for benchmarking RDF and Graph technologies. More than one and a half years of work has led us to the creation of the first two workloads, the Semantic Publishing Benchmark and the Social Network Benchmark in its …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/page/7/index.html b/benchmarks/page/7/index.html new file mode 100644 index 00000000..7166902d --- /dev/null +++ b/benchmarks/page/7/index.html @@ -0,0 +1,794 @@ + + + + + Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Benchmarks

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

2nd International Workshop on Benchmarking RDF Systems

+
Tags:
+ WORKSHOP + , CFP + , BENCHMARK + , BERSYS + +
+
+ +

Following the 1st International Workshop on Benchmarking RDF Systems (BeRSys 2013), the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industry practitioners can meet to discuss topics related to the performance of RDF systems. BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines - in the line of the TPCTC series of workshops. The focus of the workshop is to expose and initiate …

+ +
+
+ +
+ + +
+
+
+ +

DATAGEN: Data Generation for the Social Network Benchmark

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective to provide a realistic yet challenging workload, consisting of a social network and a set of queries. Both have to be realistic, easy to understand and easy to generate. This post has the objective to discuss the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 [1].

+

One of the most …

+ +
+
+ +
+ + +
+
+
+ +

Getting Started With SNB

+
Tags:
+ SNB + , INTERACTIVE + , DATAGEN + +
+
+ +

In a previous blog post titled “Is SNB like Facebook’s LinkBench?”, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.

+

DATAGEN

+

DATAGEN is the data generator used by all the workloads of SNB. Here we introduced the …

+ +
+
+ +
+ + +
+
+ +
+ +

The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads: interactive, business intelligence, and graph analytics. This post introduces the interactive workload.

+

The benchmark measures the speed of queries of medium complexity against a social network being constantly updated. The queries are scoped to a user’s social environment and potentially access data associated with the friends of a user and their friends.

+

This …

+ +
+
+ +
+ + +
+
+
+ +

Is SNB Like Facebook's LinkBench

+
Tags:
+ DEVELOPER + , SNB + , INTERACTIVE + , BI + , GRAPHALYTICS + +
+
+ + + post/is-snb-like-facebooks-linkbench/SNB-workloads-vs-systems.jpg +
+ +
+ +

In this post, I will discuss in some detail the rationale and goals of the design of the Social Network Benchmark (SNB) and explain how it relates to real …

+ +
+
+ +
+ + +
+
+
+ +

Making It Interactive

+
Tags:
+ SNB + , BENCHMARKING + , TPC + , SPARQL + , INTERACTIVE + +
+
+ +

Synopsis: Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must be both credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation for what online systems in fact do. So, the workload mix must strike a balance between the practice and presenting new challenges.

+

It is about to be showtime for LDBC. The initial installment of the …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/page/8/index.html b/benchmarks/page/8/index.html new file mode 100644 index 00000000..4857bae8 --- /dev/null +++ b/benchmarks/page/8/index.html @@ -0,0 +1,709 @@ + + + + + Benchmarks + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Benchmarks

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

SNB Data Generator - Getting Started

+
Tags:
+ DATAGEN + , SNB + , SOCIAL NETWORK + +
+
+ +

In previous posts (this and this) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datasets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.

+

Getting and Configuring Hadoop

+

DATAGEN runs on top of Hadoop 1.2.1 in order to scale. …

+ +
+
+ +
+ + +
+
+
+ +

The Day of Graph Analytics

+
Tags:
+ ANALYTICS + , SNB + +
+
+ +

Note: consider this post as a continuation of the “Making it interactive” post by Orri Erling.

+

I have now completed the Virtuoso TPC-H work, including scale out. Optimization possibilities extend to infinity but the present level is good enough. TPC-H is the classic of all analytics benchmarks and is difficult enough, I have extensive commentary on this on my blog (In Hoc Signo Vinces series), including experimental results. This is, …

+ +
+
+ +
+ + +
+
+
+ +

Using LDBC SPB to Find OWLIM Performance Issues

+
Tags:
+ LDBC + , SPB + , RDF + +
+
+ +

During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC Semantic Publishing Benchmark (LDBC-SPB) as a part of our development and release process.

+

The first thing we started using LDBC-SPB for is to monitor the performance of our RDF store when a new release is about to come out.

+

Initially we decided to fix some of the benchmark parameters:

+
    +
  • the dataset size: 50 million triples (LDBC-SPB50)
  • benchmark warmup …
+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/snb-bi/index.html b/benchmarks/snb-bi/index.html new file mode 100644 index 00000000..cac5312a --- /dev/null +++ b/benchmarks/snb-bi/index.html @@ -0,0 +1,566 @@ + + + + + LDBC SNB Business Intelligence workload + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + + + + + +
+
+
+
+ + +

LDBC SNB Business Intelligence workload

+ + + + +
+
+
+
+ + + + + +
+ + + +
+
+
+
+

The LDBC SNB Business Intelligence workload focuses on aggregation- and join-heavy complex queries that touch a large portion of the graph, combined with microbatches of insert/delete operations. Its data sets are available in Cloudflare R2.

+

For an overview of the workload, see the VLDB 2023 paper and its presentation by Gabor Szarnyas.

+

The workload produces scoring metrics for performance (power and throughput scores) at the given scale, as well as price/performance metrics. The full disclosure reports (FDR) further break down the composition of the metrics into their constituent parts, e.g. individual query execution times.

+

Note that the system cost is the sum of the license, hardware, and maintenance costs, where maintenance means 24/7 support with a response time of less than 4 hours.
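The relation between the raw scores, the system cost, and the price-adjusted scores listed below can be reproduced with a few lines of Python. The assumption here, which matches the published numbers, is that a price-adjusted score equals the raw score divided by the system cost expressed in thousands of the pricing currency.

```python
# Assumption (consistent with the published numbers): the price-adjusted score
# equals the raw score divided by the system cost in thousands of the currency.
def price_adjusted(score, system_cost):
    return score / (system_cost / 1000.0)

# Checking against the TigerGraph 3.7.0 SF 100 result listed below:
power, throughput, cost_usd = 6253.72, 3723.44, 142815
print(round(price_adjusted(power, cost_usd), 2))       # 43.79
print(round(price_adjusted(throughput, cost_usd), 2))  # 26.07
```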

+
+ +

Audited results

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Benchmark setup | SF | Hardware | Performance metrics and cost | Documents

• System: TuGraph 0.9
• Test sponsor: TuGraph, Ant Yunchuang Digital Technology (Beijing) Co., Ltd.
• Date: 2023-12-03
• Query language: Gremlin
• System cost: 5,649,500 USD
SF: 30,000 | Hardware: 72 Alibaba Cloud ecs.r7.16xlarge instances: 64×Intel Xeon Platinum 8369B vCPUs, 512 GiB RAM per instance
• Power@SF: 111,775.39
• Power@SF (price-adjusted): 19.79
• Throughput@SF: 56,920.48
• Throughput@SF (price-adjusted): 10.08

• System: TigerGraph 3.7.0
• Test sponsor: TigerGraph
• Date: 2023-04-06
• Query language: GSQL
• System cost: 142,815 USD
SF: 100 | Hardware: 1 AWS r6a.4xlarge instance: 16×AMD EPYC 7R13 vCPUs, 128 GiB RAM
• Power@SF: 6,253.72
• Power@SF (price-adjusted): 43.79
• Throughput@SF: 3,723.44
• Throughput@SF (price-adjusted): 26.07

• System: TigerGraph 3.7.0
• Test sponsor: TigerGraph
• Date: 2023-04-06
• Query language: GSQL
• System cost: 1,302,174 USD
SF: 1,000 | Hardware: 4 AWS r6a.8xlarge instances: 32×AMD EPYC 7R13 vCPUs, 256 GiB RAM per instance
• Power@SF: 23,951.74
• Power@SF (price-adjusted): 18.39
• Throughput@SF: 10,605.12
• Throughput@SF (price-adjusted): 8.14

• System: TigerGraph 3.7.0
• Test sponsor: TigerGraph
• Date: 2023-04-06
• Query language: GSQL
• System cost: 7,871,354 USD
SF: 10,000 | Hardware: 48 AWS r6a.8xlarge instances: 32×AMD EPYC 7R13 vCPUs, 256 GiB RAM per instance
• Power@SF: 89,444.50
• Power@SF (price-adjusted): 11.36
• Throughput@SF: 41,025.76
• Throughput@SF (price-adjusted): 5.21

• System: TigerGraph 3.7.0
• Test sponsor: TigerGraph
• Date: 2022-11-09
• Query language: GSQL
• System cost: 1,353,315 USD
SF: 1,000 | Hardware: Dell PowerEdge 6625 with 64×AMD EPYC 9354 CPU cores and 1.5 TiB RAM
• Power@SF: 30,990.08
• Power@SF (price-adjusted): 22.90
• Throughput@SF: 12,993.85
• Throughput@SF (price-adjusted): 9.60

The audited LDBC SNB BI results displayed above are available as a CSV file.

+

LDBC-certified auditors

+

SNB BI audits can be commissioned from the following LDBC-certified auditors:

+
    +
  • Fabian Murariu (Pometry Ltd.)
  • +
  • David Püroja
  • +
+ +
+
+
+
+ + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/snb-interactive/index.html b/benchmarks/snb-interactive/index.html new file mode 100644 index 00000000..42f80aaf --- /dev/null +++ b/benchmarks/snb-interactive/index.html @@ -0,0 +1,753 @@ + + + + + LDBC SNB Interactive workload + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + + + + + +
+
+
+
+ + +

LDBC SNB Interactive workload

+ + + + +
+
+
+
+ + + + + +
+ + + +
+
+
+
+

The LDBC SNB Interactive workload captures a transactional graph processing scenario with complex read queries that access the neighbourhood of a given node in the graph and update operations that continuously insert new data into the graph. Its data sets are available in the CWI/SURF data repository.

+

The workload produces the throughput metric to characterize the performance at the given scale. The full disclosure reports (FDR) further detail the performance of the system under test by listing the data loading time and single query execution times.
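As a simple illustration (not the benchmark's formal definition), the throughput numbers below are operations-per-second figures: the number of completed operations divided by the elapsed wall-clock time of the measurement window. A minimal sketch:

```python
# Illustration only, not the benchmark's formal definition: throughput is an
# operations-per-second figure, i.e. completed operations divided by the
# elapsed wall-clock time of the measurement window (the benchmark itself adds
# further requirements, e.g. on-time execution of scheduled operations).
def throughput_ops_per_second(completed_operations, elapsed_seconds):
    return completed_operations / elapsed_seconds

# Hypothetical run: 21.6 million operations completed in a 30-minute window.
print(throughput_ops_per_second(21_600_000, 30 * 60))  # 12000.0 ops/s
```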

+

Note that the system cost is the sum of the license, hardware, and maintenance costs, where maintenance means 24/7 support with a response time of less than 4 hours.

+
+ + +

Audited results using a declarative query language

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Benchmark setup | SF | Hardware | Throughput | Documents

• System: GraphDB 10.1.1
• Test sponsor: Ontotext
• Date: 2023-01-31
• Query language: SPARQL
• System cost: 216,222 USD
SF: 30 | Hardware: AWS r6id.8xlarge, 256 GiB RAM, 32×Intel Xeon Platinum 8375C vCPUs, 1 read thread, 1 write thread | Throughput: 3.04 ops/s
SF: 30 | Hardware: AWS r6id.8xlarge, 256 GiB RAM, 32×Intel Xeon Platinum 8375C vCPUs, 2 read threads, 2 write threads | Throughput: 6.76 ops/s
SF: 30 | Hardware: AWS r6id.8xlarge, 256 GiB RAM, 32×Intel Xeon Platinum 8375C vCPUs, 4 read threads, 4 write threads | Throughput: 12.16 ops/s
+ + + +

Audited results using an imperative language

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Benchmark setup | SF | Hardware | Throughput | Documents

• System: GraphScope Flex 0.26.1
• Test sponsor: Alibaba Cloud
• Date: 2024-05-14
• Queries implemented in: C++ stored procedures
• System cost: 738,724 RMB
SF: 100 | Hardware: Alibaba Cloud ecs.r8a.16xlarge, 512 GiB RAM, 64×AMD EPYC 9T24 @ 3.7GHz vCPUs | Throughput: 130,098.36 ops/s
SF: 300 | Hardware: Alibaba Cloud ecs.r8a.16xlarge, 512 GiB RAM, 64×AMD EPYC 9T24 @ 3.7GHz vCPUs | Throughput: 131,263.87 ops/s
SF: 1,000 | Hardware: Alibaba Cloud ecs.r8a.16xlarge, 512 GiB RAM, 64×AMD EPYC 9T24 @ 3.7GHz vCPUs | Throughput: 127,784.51 ops/s

• System: AtlasGraph 3.0.0
• Test sponsor: StarGraph
• Date: 2023-12-25
• Queries implemented in: Rust stored procedures
• System cost: 2,032,461 RMB
SF: 30 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 37,631.25 ops/s
SF: 100 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 48,764.08 ops/s
SF: 300 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 48,311.63 ops/s

• System: GraphScope Flex 0.23.0
• Test sponsor: Alibaba DAMO Academy
• Date: 2023-07-13
• Queries implemented in: C++ stored procedures
• System cost: 99,236 USD
SF: 30 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8175M vCPUs | Throughput: 33,180.87 ops/s
SF: 100 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8175M vCPUs | Throughput: 33,625.36 ops/s
SF: 300 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8175M vCPUs | Throughput: 33,261.38 ops/s

• System: TuGraph 3.3.4
• Test sponsor: Ant Group
• Date: 2023-01-28
• Queries implemented in: C++ stored procedures
• System cost: 277,542 RMB
SF: 30 | Hardware: Alibaba Cloud ecs.g8y.16xlarge, 256 GiB RAM, 64×Arm-based YiTian 710 vCPUs | Throughput: 16,133.08 ops/s
SF: 100 | Hardware: Alibaba Cloud ecs.g8y.16xlarge, 256 GiB RAM, 64×Arm-based YiTian 710 vCPUs | Throughput: 16,966.26 ops/s
SF: 300 | Hardware: Alibaba Cloud ecs.g8y.16xlarge, 256 GiB RAM, 64×Arm-based YiTian 710 vCPUs | Throughput: 13,532.62 ops/s

• System: TuGraph 3.2.0
• Test sponsor: Ant Group
• Date: 2022-08-16
• Queries implemented in: C++ stored procedures
• System cost: 291,176 USD
SF: 30 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 12,252.50 ops/s
SF: 100 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 12,934.61 ops/s
SF: 300 | Hardware: AWS r5d.12xlarge, 384 GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 12,721.24 ops/s

• System: Galaxybase 3.3.0
• Test sponsor: CreateLink
• Date: 2022-05-16
• Queries implemented in: Java stored procedures
• System cost: 263,282 USD
SF: 30 | Hardware: AWS r5d.12xlarge, 372 GB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 9,285.86 ops/s
SF: 100 | Hardware: AWS r5d.12xlarge, 372 GB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 8,501.21 ops/s
SF: 300 | Hardware: AWS r5d.12xlarge, 372 GB RAM, 48×Intel Xeon Platinum 8259CL vCPUs | Throughput: 8,370.52 ops/s

• System: TuGraph 1.1
• Test sponsor: FMA
• Date: 2020-07-26
• Queries implemented in: C++ stored procedures
• System cost: 280,650 USD
SF: 30 | Hardware: AWS r5d.12xlarge, 374 GB RAM, 48×Intel Xeon Platinum 8175M vCPUs | Throughput: 5,436.47 ops/s
SF: 100 | Hardware: AWS r5d.12xlarge, 374 GB RAM, 48×Intel Xeon Platinum 8175M vCPUs | Throughput: 5,010.77 ops/s
SF: 300 | Hardware: AWS r5d.12xlarge, 374 GB RAM, 48×Intel Xeon Platinum 8175M vCPUs | Throughput: 4,855.52 ops/s
+ + +

Results as a CSV file

+

The audited LDBC SNB Interactive results displayed above are available as a CSV file.
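The CSV file is pipe-separated; a minimal Python sketch for reading it follows. The file path and column names are taken from the data/snb_interactive.csv file published with this site.

```python
import csv

# Minimal sketch: read the pipe-separated results file published with this
# site (data/snb_interactive.csv) and print one line per audited run. Column
# names are taken from the file's header row.
with open("data/snb_interactive.csv", newline="") as f:
    for row in csv.DictReader(f, delimiter="|"):
        print(row["date"], row["software_name"], row["software_version"],
              "SF" + row["scale_factor"], row["throughput"], "ops/s")
```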

+

LDBC-certified auditors

+

SNB Interactive audits can be commissioned from the following LDBC-certified auditors:

+
    +
  • Márton Búr
  • +
  • Arnau Prat-Pérez
  • +
  • David Püroja
  • +
+

Legacy audited results

+

Social Network Benchmark Interactive, version 0.2.2

+

Future workloads

+

The LDBC SNB Interactive v2 workload is currently under development. See the TPCTC 2023 paper “The LDBC Social Network Benchmark Interactive Workload v2: A Transactional Graph Query Benchmark with Deep Delete Operations” and its slide deck for details.

+ +
+
+
+
+ + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph-executive_summary.pdf new file mode 100644 index 00000000..92155d75 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph-signatures.pdf b/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph-signatures.pdf new file mode 100644 index 00000000..a4c50672 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph.pdf b/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph.pdf new file mode 100644 index 00000000..63b7b02b Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20221109_SF1000_tigergraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20230406_SF10000_tigergraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_BI_20230406_SF10000_tigergraph-executive_summary.pdf new file mode 100644 index 00000000..a549af81 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20230406_SF10000_tigergraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20230406_SF10000_tigergraph.pdf b/benchmarks/snb/LDBC_SNB_BI_20230406_SF10000_tigergraph.pdf new file mode 100644 index 00000000..e8688813 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20230406_SF10000_tigergraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20230406_SF1000_tigergraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_BI_20230406_SF1000_tigergraph-executive_summary.pdf new file mode 100644 index 00000000..3e284938 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20230406_SF1000_tigergraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20230406_SF1000_tigergraph.pdf b/benchmarks/snb/LDBC_SNB_BI_20230406_SF1000_tigergraph.pdf new file mode 100644 index 00000000..8a8c06d7 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20230406_SF1000_tigergraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-signatures.pdf b/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-signatures.pdf new file mode 100644 index 00000000..6a43472f Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_tigergraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_tigergraph-executive_summary.pdf new file mode 100644 index 00000000..e1930c2b Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_tigergraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_tigergraph.pdf b/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_tigergraph.pdf new file mode 100644 index 00000000..4e1ce728 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20230406_SF100_tigergraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph-executive_summary.pdf new file mode 100644 index 00000000..49e9e3cf Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph-signatures.pdf 
b/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph-signatures.pdf new file mode 100644 index 00000000..4b8322ac Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph.pdf b/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph.pdf new file mode 100644 index 00000000..4c2c8ba5 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_BI_20231203_SF30000_tugraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20150427_SF100_sparksee.pdf b/benchmarks/snb/LDBC_SNB_I_20150427_SF100_sparksee.pdf new file mode 100644 index 00000000..29af3830 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20150427_SF100_sparksee.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20150427_SF100_virtuoso.pdf b/benchmarks/snb/LDBC_SNB_I_20150427_SF100_virtuoso.pdf new file mode 100644 index 00000000..064b348c Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20150427_SF100_virtuoso.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20150427_SF10_sparksee.pdf b/benchmarks/snb/LDBC_SNB_I_20150427_SF10_sparksee.pdf new file mode 100644 index 00000000..e3908056 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20150427_SF10_sparksee.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20150427_SF300_virtuoso.pdf b/benchmarks/snb/LDBC_SNB_I_20150427_SF300_virtuoso.pdf new file mode 100644 index 00000000..8cd9fecd Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20150427_SF300_virtuoso.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20150427_SF30_sparksee.pdf b/benchmarks/snb/LDBC_SNB_I_20150427_SF30_sparksee.pdf new file mode 100644 index 00000000..c97aa8eb Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20150427_SF30_sparksee.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20150427_SF30_virtuoso.pdf b/benchmarks/snb/LDBC_SNB_I_20150427_SF30_virtuoso.pdf new file mode 100644 index 00000000..d18bd7ca Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20150427_SF30_virtuoso.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph-executive_summary.pdf new file mode 100644 index 00000000..20ba1174 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph-signatures.pdf b/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph-signatures.pdf new file mode 100644 index 00000000..808c2e18 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph.pdf b/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph.pdf new file mode 100644 index 00000000..ef07701f Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20200726_SF30-100-300_tugraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-executive_summary.pdf new file mode 100644 index 00000000..33e6a074 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-signatures.pdf b/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-signatures.pdf new file mode 100644 index 00000000..60b2d6dc Binary files /dev/null and 
b/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase.pdf b/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase.pdf new file mode 100644 index 00000000..380c2c56 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20220516_SF30-100-300_galaxybase.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph-executive_summary.pdf new file mode 100644 index 00000000..93cda796 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph-signatures.pdf b/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph-signatures.pdf new file mode 100644 index 00000000..6cb96bac Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph.pdf b/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph.pdf new file mode 100644 index 00000000..61ea8cfa Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20220816_SF30-100-300_tugraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph-executive_summary.pdf new file mode 100644 index 00000000..1843d2a8 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph-signatures.pdf b/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph-signatures.pdf new file mode 100644 index 00000000..44f34eb1 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph.pdf b/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph.pdf new file mode 100644 index 00000000..a45d8dc1 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230128_SF30-100-300_tugraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb-executive_summary.pdf new file mode 100644 index 00000000..2cb9c47c Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb-signatures.pdf b/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb-signatures.pdf new file mode 100644 index 00000000..14bc45bb Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb.pdf b/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb.pdf new file mode 100644 index 00000000..107daba5 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230131_SF30_graphdb.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-executive_summary.pdf new file mode 100644 index 00000000..41fc60d1 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-signatures.pdf 
b/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-signatures.pdf new file mode 100644 index 00000000..7b79ec81 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex.pdf b/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex.pdf new file mode 100644 index 00000000..f485d158 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-executive_summary.pdf new file mode 100644 index 00000000..2b9fc924 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-signatures.pdf b/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-signatures.pdf new file mode 100644 index 00000000..bb70d112 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph.pdf b/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph.pdf new file mode 100644 index 00000000..e94c0647 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf b/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf new file mode 100644 index 00000000..88dcb08e Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-signatures.pdf b/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-signatures.pdf new file mode 100644 index 00000000..3fabcbad Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-signatures.pdf differ diff --git a/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf b/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf new file mode 100644 index 00000000..d5046940 Binary files /dev/null and b/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf differ diff --git a/benchmarks/snb/audited-results-v0.2.2/index.html b/benchmarks/snb/audited-results-v0.2.2/index.html new file mode 100644 index 00000000..d3214043 --- /dev/null +++ b/benchmarks/snb/audited-results-v0.2.2/index.html @@ -0,0 +1,425 @@ + + + + + LDBC Social Network Benchmark legacy audited results + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

LDBC Social Network Benchmark legacy audited results

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

SNB Interactive (version 0.2.2) audited results

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
SF | Throughput | Cost | Software | Hardware | Test Sponsor | Date | Full Disclosure Report

10 | 101.20 ops/s | 30,427 EUR | Sparksee 5.1.1 | 2×Xeon 2630v3 8-core 2.4GHz, 256GB RAM | Sparsity Technologies SA | 2015-04-27 | Full Disclosure Report
30 | 1,287.17 ops/s | 20,212 EUR | Virtuoso 07.50.3213 v7fasttrack | 2×Xeon 2630 6-core 2.4GHz, 192GB RAM | OpenLink Software | 2015-04-27 | Full Disclosure Report
30 | 86.50 ops/s | 30,427 EUR | Sparksee 5.1.1 | 2×Xeon 2630v3 8-core 2.4GHz, 256GB RAM | Sparsity Technologies SA | 2015-04-27 | Full Disclosure Report
100 | 1,200.00 ops/s | 20,212 EUR | Virtuoso 07.50.3213 v7fasttrack | 2×Xeon 2630 6-core 2.4GHz, 192GB RAM | OpenLink Software | 2015-04-27 | Full Disclosure Report
100 | 81.70 ops/s | 37,927 EUR | Sparksee 5.1.1 | 2×Xeon 2630v3 8-core 2.4GHz, 256GB RAM | Sparsity Technologies SA | 2015-04-27 | Full Disclosure Report
300 | 635.00 ops/s | 20,212 EUR | Virtuoso 07.50.3213 v7fasttrack | 2×Xeon 2630 6-core 2.4GHz, 192GB RAM | OpenLink Software | 2015-04-27 | Full Disclosure Report
+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/snb/index.html b/benchmarks/snb/index.html new file mode 100644 index 00000000..7bf986fe --- /dev/null +++ b/benchmarks/snb/index.html @@ -0,0 +1,370 @@ + + + + + LDBC Social Network Benchmark (LDBC SNB) + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

LDBC Social Network Benchmark (LDBC SNB)

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

The Social Network Benchmark (SNB) suite defines graph workloads targeting database management systems and is maintained by the LDBC SNB Task Force.

+

The benchmark suite consists of two distinct workloads on a common dataset:

+
    +
  • The Business Intelligence workload focuses on aggregation- and join-heavy complex queries that touch a large portion of the graph, combined with microbatches of insert/delete operations. Its data sets are available in Cloudflare R2 and in the SURF/CWI repository.
  • +
  • The Interactive workload captures a transactional graph processing scenario with complex read queries that access the neighbourhood of a given node in the graph and update operations that continuously insert new data into the graph. Its data sets are available in the CWI/SURF data repository.
  • +
+

For a brief overview, see our talk given at FOSDEM 2023’s graph developer room. The Social Network Benchmark’s specification can be found on arXiv.

+

Audited results

+

– SNB Business Intelligence workload

+

– SNB Interactive workload

+

Commissioning audits

+

For auditing requests, please reach out to info@ldbcouncil.org. Audits can only be commissioned by LDBC member companies, by contracting any of the LDBC-certified auditors. Note that there is a 2,000 GBP auditing fee to be paid to the LDBC by non-sponsor company members. Sponsor companies are exempt from this fee.

+

For a short summary of LDBC’s auditing process, including preparation steps, timelines, and pricing, see the Auditing process for the LDBC Social Network Benchmark document.

+

Use of audited results

+

Fair use policies

+

The LDBC Social Network Benchmark is subject to the LDBC Fair Use Policies.

+ + + +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/snb/ldbc-snb-work-charter.pdf b/benchmarks/snb/ldbc-snb-work-charter.pdf new file mode 100644 index 00000000..9743055c Binary files /dev/null and b/benchmarks/snb/ldbc-snb-work-charter.pdf differ diff --git a/benchmarks/snb/retrospective-report-neo4j.pdf b/benchmarks/snb/retrospective-report-neo4j.pdf new file mode 100644 index 00000000..e99d9111 Binary files /dev/null and b/benchmarks/snb/retrospective-report-neo4j.pdf differ diff --git a/benchmarks/snb/retrospective-report-oracle.pdf b/benchmarks/snb/retrospective-report-oracle.pdf new file mode 100644 index 00000000..fddf907e Binary files /dev/null and b/benchmarks/snb/retrospective-report-oracle.pdf differ diff --git a/benchmarks/snb/retrospective-report-tigergraph.pdf b/benchmarks/snb/retrospective-report-tigergraph.pdf new file mode 100644 index 00000000..8468fd07 Binary files /dev/null and b/benchmarks/snb/retrospective-report-tigergraph.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-1G-Virtuoso-09062015.pdf b/benchmarks/spb/LDBC-SPB-1G-Virtuoso-09062015.pdf new file mode 100644 index 00000000..a46849c9 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-1G-Virtuoso-09062015.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-1G-Virtuoso-EC2-10062015.pdf b/benchmarks/spb/LDBC-SPB-1G-Virtuoso-EC2-10062015.pdf new file mode 100644 index 00000000..def15fc9 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-1G-Virtuoso-EC2-10062015.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-256M-GraphDB-10062015.pdf b/benchmarks/spb/LDBC-SPB-256M-GraphDB-10062015.pdf new file mode 100644 index 00000000..1b30a9ca Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-256M-GraphDB-10062015.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-256M-Virtuoso-09062015.pdf b/benchmarks/spb/LDBC-SPB-256M-Virtuoso-09062015.pdf new file mode 100644 index 00000000..672c9cf7 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-256M-Virtuoso-09062015.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-256M-Virtuoso-EC2-10062015-v2.pdf b/benchmarks/spb/LDBC-SPB-256M-Virtuoso-EC2-10062015-v2.pdf new file mode 100644 index 00000000..34ea9e86 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-256M-Virtuoso-EC2-10062015-v2.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-64M-GraphDB-10062015.pdf b/benchmarks/spb/LDBC-SPB-64M-GraphDB-10062015.pdf new file mode 100644 index 00000000..b0d71274 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-64M-GraphDB-10062015.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-64M-Virtuoso-09062015.pdf b/benchmarks/spb/LDBC-SPB-64M-Virtuoso-09062015.pdf new file mode 100644 index 00000000..e5d86326 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-64M-Virtuoso-09062015.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-SF3-GraphDB-cluster-20230129-executive-summary.pdf b/benchmarks/spb/LDBC-SPB-SF3-GraphDB-cluster-20230129-executive-summary.pdf new file mode 100644 index 00000000..58bf4f57 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-SF3-GraphDB-cluster-20230129-executive-summary.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-SF3-GraphDB-cluster-20230129.pdf b/benchmarks/spb/LDBC-SPB-SF3-GraphDB-cluster-20230129.pdf new file mode 100644 index 00000000..8357aa61 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-SF3-GraphDB-cluster-20230129.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-SF3-GraphDB-single-machine-20230129-executive-summary.pdf 
b/benchmarks/spb/LDBC-SPB-SF3-GraphDB-single-machine-20230129-executive-summary.pdf new file mode 100644 index 00000000..74243ed5 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-SF3-GraphDB-single-machine-20230129-executive-summary.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-SF3-GraphDB-single-machine-20230129.pdf b/benchmarks/spb/LDBC-SPB-SF3-GraphDB-single-machine-20230129.pdf new file mode 100644 index 00000000..0c4ea85d Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-SF3-GraphDB-single-machine-20230129.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-SF5-GraphDB-cluster-20230129-executive-summary.pdf b/benchmarks/spb/LDBC-SPB-SF5-GraphDB-cluster-20230129-executive-summary.pdf new file mode 100644 index 00000000..74cbcea1 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-SF5-GraphDB-cluster-20230129-executive-summary.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-SF5-GraphDB-cluster-20230129.pdf b/benchmarks/spb/LDBC-SPB-SF5-GraphDB-cluster-20230129.pdf new file mode 100644 index 00000000..e17d3bc4 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-SF5-GraphDB-cluster-20230129.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-SF5-GraphDB-single-machine-20230129-executive-summary.pdf b/benchmarks/spb/LDBC-SPB-SF5-GraphDB-single-machine-20230129-executive-summary.pdf new file mode 100644 index 00000000..e1e82e68 Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-SF5-GraphDB-single-machine-20230129-executive-summary.pdf differ diff --git a/benchmarks/spb/LDBC-SPB-SF5-GraphDB-single-machine-20230129.pdf b/benchmarks/spb/LDBC-SPB-SF5-GraphDB-single-machine-20230129.pdf new file mode 100644 index 00000000..d22954fb Binary files /dev/null and b/benchmarks/spb/LDBC-SPB-SF5-GraphDB-single-machine-20230129.pdf differ diff --git a/benchmarks/spb/LDBC_SPB20_20150426_SF1_GraphDB-EE-6.2b.pdf b/benchmarks/spb/LDBC_SPB20_20150426_SF1_GraphDB-EE-6.2b.pdf new file mode 100644 index 00000000..dc61ff00 Binary files /dev/null and b/benchmarks/spb/LDBC_SPB20_20150426_SF1_GraphDB-EE-6.2b.pdf differ diff --git a/benchmarks/spb/LDBC_SPB20_20150426_SF3_GraphDB-EE-6.2b.pdf b/benchmarks/spb/LDBC_SPB20_20150426_SF3_GraphDB-EE-6.2b.pdf new file mode 100644 index 00000000..f4865212 Binary files /dev/null and b/benchmarks/spb/LDBC_SPB20_20150426_SF3_GraphDB-EE-6.2b.pdf differ diff --git a/benchmarks/spb/index.html b/benchmarks/spb/index.html new file mode 100644 index 00000000..a3bf413c --- /dev/null +++ b/benchmarks/spb/index.html @@ -0,0 +1,598 @@ + + + + + LDBC Semantic Publishing Benchmark (LDBC SPB) + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

LDBC Semantic Publishing Benchmark (LDBC-SPB)

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

The Semantic Publishing Benchmark (SPB) is an LDBC benchmark for testing the performance of RDF engines, inspired by the media/publishing industry. In particular, LDBC worked with the British Broadcasting Corporation (BBC) to define this benchmark, for which the BBC donated workloads, ontologies and data. The publishing industry is an area where significant adoption of RDF is taking place.

+

There have been many academic benchmarks for RDF but none of these are truly industrial-grade. The SPB combines a set of complex queries under inference with continuous updates and special failover tests for systems implementing replication.

+

SPB performance is measured by producing a workload of CRUD (Create, Read, Update, Delete) operations which are executed simultaneously. The benchmark offers a data generator that uses real reference data to produce datasets of various sizes and tests the scalability aspect of RDF systems. The benchmark workload consists of (a) editorial operations that add new data or alter or delete existing data, and (b) aggregation operations that retrieve content according to various criteria. The benchmark also tests conformance to various rules of the OWL2-RL rule-set.

+

The SPB specification contains the description of the benchmark and the data generator and all information about its software components can be found on the SPB developer page.

+

Semantic Publishing Benchmark (SPB) Audited Results

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
SF | Triples | RW Agents | Interactive (Q/sec) | Updates (ops/sec) | Cost | Software | Hardware | Test Sponsor | Date | FDR
3
256M
16 / 4
335.48
25.66
177,474 USD
GraphDB EE 10.0.1 | AWS r6id.8xlarge | Ontotext AD | FDR, summary
3
256M
24 / 0
413.16
0.00
207,474 USD
GraphDB EE 10.0.1 | AWS r6id.8xlarge | Ontotext AD | FDR, summary
3
256M
64 / 4
1121.76
9.53
652,422 USD
GraphDB EE 10.0.1 | 3×AWS r6id.8xlarge | Ontotext AD | FDR, summary
3
256M
64 / 0
985.63
0.00
562,422 USD
GraphDB EE 10.0.1 | 3×AWS r6id.8xlarge | Ontotext AD | FDR, summary
5
1B
16 / 4
105.76
10.45
177,474 USD
GraphDB EE 10.0.1 | AWS r6id.8xlarge | Ontotext AD | FDR, summary
5
1B
24 / 0
158.10
0.00
207,474 USD
GraphDB EE 10.0.1 | AWS r6id.8xlarge | Ontotext AD | FDR, summary
5
1B
64 / 4
372.56
4.04
652,422 USD
GraphDB EE 10.0.1 | 3×AWS r6id.8xlarge | Ontotext AD | FDR, summary
5
1B
64 / 0
408.68
0.00
562,422 USD
GraphDB EE 10.0.1 | 3×AWS r6id.8xlarge | Ontotext AD | FDR, summary
1
64M
8 / 2
100.85
10.19
37,504 EUR
GraphDB EE 6.2 | Intel Xeon E5-1650v3 6×3.5GHz, 96GB RAM | Ontotext AD | FDR
1
64M
8 / 2
142.76
10.67
35,323 EUR
GraphDB SE 6.3 alpha | Intel Xeon E5-1650v3 6×3.5GHz, 64GB RAM | Ontotext AD | FDR
3
256M
8 / 2
29.90
9.50
37,504 EUR
GraphDB EE 6.2 | Intel Xeon E5-1650v3 6×3.5GHz, 96GB RAM | Ontotext AD | FDR
3
256M
8 / 2
54.64
9.50
35,323 EUR
GraphDB SE 6.3 alpha | Intel Xeon E5-1650v3 6×3.5GHz, 64GB RAM | Ontotext AD | FDR
1
64M
22 / 2
149.04
156.83
20,213 USD
Virtuoso v7.50.3213 | Intel Xeon E5-2630 6×2.30GHz, 192 GB RAM | OpenLink Software | FDR
3
256M
22 / 2
80.62
92.71
20,213 USD
Virtuoso v7.50.3213 | Intel Xeon E5-2630 6×2.30GHz, 192 GB RAM | OpenLink Software | FDR
3
256M
30 / 3
115.38
109.85
24,528 USD
Virtuoso v7.50.3213 | AWS r3.8xlarge | OpenLink Software | FDR
5
1B
22 / 2
32.28
72.72
20,213 USD
Virtuoso v7.50.3213 | Intel Xeon E5-2630 6×2.30GHz, 192 GB RAM | OpenLink Software | FDR
5
1B
30 / 3
45.81
55.45
24,528 USD
Virtuoso v7.50.3213 | AWS r3.8xlarge | OpenLink Software | FDR
+

LDBC-certified auditors

+

SPB audits can be commissioned from the following LDBC-certified auditors:

+
    +
  • Pjotr Scholtze
  • +
+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/benchmarks/spb/ldbc-spb-v2.0-specification.pdf b/benchmarks/spb/ldbc-spb-v2.0-specification.pdf new file mode 100644 index 00000000..a91e5a91 Binary files /dev/null and b/benchmarks/spb/ldbc-spb-v2.0-specification.pdf differ diff --git a/constitutional-documents/index.html b/constitutional-documents/index.html new file mode 100644 index 00000000..2a991f42 --- /dev/null +++ b/constitutional-documents/index.html @@ -0,0 +1,362 @@ + + + + + Constitutional Documents + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Constitutional Documents

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

This page contains LDBC’s constitutional documents: its Articles of Association and Byelaws.

+

Current versions

+ +

Old versions

+ + +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/css/custom-style.css b/css/custom-style.css new file mode 100644 index 00000000..e69de29b diff --git a/data/snb_bi.csv b/data/snb_bi.csv new file mode 100644 index 00000000..158aabf3 --- /dev/null +++ b/data/snb_bi.csv @@ -0,0 +1,6 @@ +date|test_sponsor_name|test_sponsor_url|software_name|software_version|software_url|specification_version|specification_url|driver_version|driver_url|full_disclosure_report|executive_summary|signatures|supplementary_package|query_implementation|scale_factor|power_at_sf|power_at_sf_price_adjusted|throughput_at_sf|throughput_at_sf_price_adjusted|price|currency|hardware +2023-12-03|TuGraph, Ant Yunchuang Digital Technology (Beijing) Co., Ltd.|https://www.tugraph.org/|TuGraph|0.9|https://www.tugraph.org/|2.2.2|https://arxiv.org/pdf/2001.02299v7.pdf|1.0.3|https://github.com/ldbc/ldbc_snb_bi/releases/tag/v1.0.3|LDBC_SNB_BI_20231203_SF30000_tugraph.pdf|LDBC_SNB_BI_20231203_SF30000_tugraph-executive_summary.pdf|LDBC_SNB_BI_20231203_SF30000_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_BI_20231203_SF30000_tugraph-attachments.tar.gz|Gremlin|30000|111775.39|19.79|56920.48|10.08|5649500|USD|72 Alibaba Cloud ecs.r7.16xlarge instances: 64×Intel Xeon Platinum 8369B vCPUs, 512 GiB RAM per instance +2023-04-06|TigerGraph|https://tigergraph.com/|TigerGraph|3.7.0|https://docs.tigergraph.com/tigergraph-server/3.7|2.2.0|https://arxiv.org/pdf/2001.02299v7.pdf|1.0.3|https://github.com/ldbc/ldbc_snb_bi/releases/tag/v1.0.3|LDBC_SNB_BI_20230406_SF100_tigergraph.pdf|LDBC_SNB_BI_20230406_SF100_tigergraph-executive_summary.pdf|LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-attachments.tar.gz|GSQL|100|6253.72|43.79|3723.44|26.07|142815|USD|1 AWS r6a.4xlarge instance: 16×AMD EPYC 7R13 vCPUs, 128GiB RAM +2023-04-06|TigerGraph|https://tigergraph.com/|TigerGraph|3.7.0|https://docs.tigergraph.com/tigergraph-server/3.7|2.2.0|https://arxiv.org/pdf/2001.02299v7.pdf|1.0.3|https://github.com/ldbc/ldbc_snb_bi/releases/tag/v1.0.3|LDBC_SNB_BI_20230406_SF1000_tigergraph.pdf|LDBC_SNB_BI_20230406_SF1000_tigergraph-executive_summary.pdf|LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-attachments.tar.gz|GSQL|1000|23951.74|18.39|10605.12|8.14|1302174|USD|4 AWS r6a.8xlarge instances: 32×AMD EPYC 7R13 vCPUs, 256GiB RAM per instance +2023-04-06|TigerGraph|https://tigergraph.com/|TigerGraph|3.7.0|https://docs.tigergraph.com/tigergraph-server/3.7|2.2.0|https://arxiv.org/pdf/2001.02299v7.pdf|1.0.3|https://github.com/ldbc/ldbc_snb_bi/releases/tag/v1.0.3|LDBC_SNB_BI_20230406_SF10000_tigergraph.pdf|LDBC_SNB_BI_20230406_SF10000_tigergraph-executive_summary.pdf|LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_BI_20230406_SF100_SF1000_SF10000_tigergraph-attachments.tar.gz|GSQL|10000|89444.50|11.36|41025.76|5.21|7871354|USD|48 AWS r6a.8xlarge instances: 32×AMD EPYC 7R13 vCPUs, 256GiB RAM per instance 
+2022-11-09|TigerGraph|https://tigergraph.com/|TigerGraph|3.7.0|https://docs.tigergraph.com/tigergraph-server/3.7|2.2.0|https://arxiv.org/pdf/2001.02299v7.pdf|1.0.2|https://github.com/ldbc/ldbc_snb_bi/releases/tag/v1.0.2|LDBC_SNB_BI_20221109_SF1000_tigergraph.pdf|LDBC_SNB_BI_20221109_SF1000_tigergraph-executive_summary.pdf|LDBC_SNB_BI_20221109_SF1000_tigergraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_BI_20221109_SF1000_tigergraph-attachments.tar.gz|GSQL|1000|30990.08|22.90|12993.85|9.60|1353315|USD|Dell PowerEdge 6625 with 64×AMD EPYC 9354 CPU cores and 1.5TiB RAM diff --git a/data/snb_interactive.csv b/data/snb_interactive.csv new file mode 100644 index 00000000..a1b22ff7 --- /dev/null +++ b/data/snb_interactive.csv @@ -0,0 +1,25 @@ +date|category|test_sponsor_name|test_sponsor_url|software_name|software_version|software_url|specification_version|specification_url|driver_version|driver_url|full_disclosure_report|executive_summary|signatures|supplementary_package|throughput_at_largest_sf|query_implementation|scale_factor|throughput|price|currency|hardware +2024-05-14|imperative|Alibaba Cloud|https://www.alibabacloud.com/|GraphScope Flex|0.26.1|https://github.com/alibaba/GraphScope|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf|LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf|LDBC_SNB_I_20240514_SF100-300-1000_graphscope-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-attachments.tar.gz|127784.51|C++ stored procedures|100|130098.36|738724|RMB|Alibaba Cloud ecs.r8a.16xlarge, 512GiB RAM, 64×AMD EPYC 9T24 @ 3.7GHz vCPUs +2024-05-14|imperative|Alibaba Cloud|https://www.alibabacloud.com/|GraphScope Flex|0.26.1|https://github.com/alibaba/GraphScope|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf|LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf|LDBC_SNB_I_20240514_SF100-300-1000_graphscope-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-attachments.tar.gz|127784.51|C++ stored procedures|300|131263.87|738724|RMB|Alibaba Cloud ecs.r8a.16xlarge, 512GiB RAM, 64×AMD EPYC 9T24 @ 3.7GHz vCPUs +2024-05-14|imperative|Alibaba Cloud|https://www.alibabacloud.com/|GraphScope Flex|0.26.1|https://github.com/alibaba/GraphScope|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf|LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf|LDBC_SNB_I_20240514_SF100-300-1000_graphscope-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-attachments.tar.gz|127784.51|C++ stored procedures|1000|127784.51|738724|RMB|Alibaba Cloud ecs.r8a.16xlarge, 512GiB RAM, 64×AMD EPYC 9T24 @ 3.7GHz vCPUs 
+2023-12-25|imperative|StarGraph|https://www.stargraph.cn/|AtlasGraph|3.0.0|https://atlasgraph.io/|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph.pdf|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-executive_summary.pdf|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-attachments.tar.gz|48311.63|Rust stored procedures|30|37631.25|2032461|RMB|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs +2023-12-25|imperative|StarGraph|https://www.stargraph.cn/|AtlasGraph|3.0.0|https://atlasgraph.io/|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph.pdf|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-executive_summary.pdf|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-attachments.tar.gz|48311.63|Rust stored procedures|100|48764.08|2032461|RMB|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs +2023-12-25|imperative|StarGraph|https://www.stargraph.cn/|AtlasGraph|3.0.0|https://atlasgraph.io/|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph.pdf|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-executive_summary.pdf|LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20231225_SF30-100-300_AtlasGraph-attachments.tar.gz|48311.63|Rust stored procedures|300|48311.63|2032461|RMB|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs +2023-07-13|imperative|Alibaba DAMO Academy|https://damo.alibaba.com/|GraphScope Flex|0.23.0|https://github.com/alibaba/GraphScope|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex.pdf|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-executive_summary.pdf|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230713_SF30-100-300_GraphscopeFlex-attachments.tar.gz|33261.38|C++ stored procedures|30|33180.87|99236|USD|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8175M vCPUs +2023-07-13|imperative|Alibaba DAMO Academy|https://damo.alibaba.com/|GraphScope Flex|0.23.0|https://github.com/alibaba/GraphScope|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex.pdf|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-executive_summary.pdf|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230713_SF30-100-300_GraphscopeFlex-attachments.tar.gz|33261.38|C++ stored procedures|100|33625.36|99236|USD|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8175M vCPUs +2023-07-13|imperative|Alibaba DAMO Academy|https://damo.alibaba.com/|GraphScope 
Flex|0.23.0|https://github.com/alibaba/GraphScope|0.3.6|https://arxiv.org/pdf/2001.02299v1.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex.pdf|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-executive_summary.pdf|LDBC_SNB_I_20230713_SF30-100-300_GraphScopeFlex-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230713_SF30-100-300_GraphscopeFlex-attachments.tar.gz|33261.38|C++ stored procedures|300|33261.38|99236|USD|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8175M vCPUs +2023-01-31|declarative|Ontotext|https://www.ontotext.com/|GraphDB|10.1.1|https://graphdb.ontotext.com/|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230131_SF30_graphdb.pdf|LDBC_SNB_I_20230131_SF30_graphdb-executive_summary.pdf|LDBC_SNB_I_20230131_SF30_graphdb-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230131_SF30_graphdb-attachments.tar.gz|12.16|SPARQL|30|3.04|216222|USD|AWS r6id.8xlarge, 256GiB RAM, 32×Intel Xeon Platinum 8375C vCPUs, 1 read thread, 1 write thread +2023-01-31|declarative|Ontotext|https://www.ontotext.com/|GraphDB|10.1.1|https://graphdb.ontotext.com/|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230131_SF30_graphdb.pdf|LDBC_SNB_I_20230131_SF30_graphdb-executive_summary.pdf|LDBC_SNB_I_20230131_SF30_graphdb-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230131_SF30_graphdb-attachments.tar.gz|12.16|SPARQL|30|6.76|216222|USD|AWS r6id.8xlarge, 256GiB RAM, 32×Intel Xeon Platinum 8375C vCPUs, 2 read threads, 2 write threads +2023-01-31|declarative|Ontotext|https://www.ontotext.com/|GraphDB|10.1.1|https://graphdb.ontotext.com/|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230131_SF30_graphdb.pdf|LDBC_SNB_I_20230131_SF30_graphdb-executive_summary.pdf|LDBC_SNB_I_20230131_SF30_graphdb-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230131_SF30_graphdb-attachments.tar.gz|12.16|SPARQL|30|12.16|216222|USD|AWS r6id.8xlarge, 256GiB RAM, 32×Intel Xeon Platinum 8375C vCPUs, 4 read threads, 4 write threads +2022-08-16|imperative|Ant Group|https://www.antgroup.com/en|TuGraph|3.2.0|https://tech.antfin.com/products/TuGraph|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20220816_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20220816_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20220816_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20200726_SF30-100-300_tugraph-attachments.tar.gz|12721.24|C++ stored procedures|30|12252.50|291176|USD|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs +2022-08-16|imperative|Ant 
Group|https://www.antgroup.com/en|TuGraph|3.2.0|https://tech.antfin.com/products/TuGraph|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20220816_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20220816_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20220816_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20200726_SF30-100-300_tugraph-attachments.tar.gz|12721.24|C++ stored procedures|100|12934.61|291176|USD|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs +2022-08-16|imperative|Ant Group|https://www.antgroup.com/en|TuGraph|3.2.0|https://tech.antfin.com/products/TuGraph|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20220816_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20220816_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20220816_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20200726_SF30-100-300_tugraph-attachments.tar.gz|12721.24|C++ stored procedures|300|12721.24|291176|USD|AWS r5d.12xlarge, 384GiB RAM, 48×Intel Xeon Platinum 8259CL vCPUs +2022-05-16|imperative|CreateLink|https://galaxybase.com/|Galaxybase|3.3.0|https://galaxybase.com/|0.3.3|https://arxiv.org/pdf/2001.02299v2.pdf|0.3.4|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/0.3.4|LDBC_SNB_I_20220516_SF30-100-300_galaxybase.pdf|LDBC_SNB_I_20220516_SF30-100-300_galaxybase-executive_summary.pdf|LDBC_SNB_I_20220516_SF30-100-300_galaxybase-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-attachments.tar.gz|8370.52|Java stored procedures|30|9285.86|263282|USD|AWS r5d.12xlarge, 372GB RAM, 48×Intel Xeon Platinum 8259CL vCPUs +2022-05-16|imperative|CreateLink|https://galaxybase.com/|Galaxybase|3.3.0|https://galaxybase.com/|0.3.3|https://arxiv.org/pdf/2001.02299v2.pdf|0.3.4|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/0.3.4|LDBC_SNB_I_20220516_SF30-100-300_galaxybase.pdf|LDBC_SNB_I_20220516_SF30-100-300_galaxybase-executive_summary.pdf|LDBC_SNB_I_20220516_SF30-100-300_galaxybase-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-attachments.tar.gz|8370.52|Java stored procedures|100|8501.21|263282|USD|AWS r5d.12xlarge, 372GB RAM, 48×Intel Xeon Platinum 8259CL vCPUs +2022-05-16|imperative|CreateLink|https://galaxybase.com/|Galaxybase|3.3.0|https://galaxybase.com/|0.3.3|https://arxiv.org/pdf/2001.02299v2.pdf|0.3.4|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/0.3.4|LDBC_SNB_I_20220516_SF30-100-300_galaxybase.pdf|LDBC_SNB_I_20220516_SF30-100-300_galaxybase-executive_summary.pdf|LDBC_SNB_I_20220516_SF30-100-300_galaxybase-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20220516_SF30-100-300_galaxybase-attachments.tar.gz|8370.52|Java stored procedures|300|8370.52|263282|USD|AWS r5d.12xlarge, 372GB RAM, 48×Intel Xeon Platinum 8259CL vCPUs 
+2020-07-26|imperative|FMA|https://fma-ai.cn/|TuGraph|1.1|https://fma-ai.cn/|0.3.2|https://arxiv.org/pdf/2001.02299v1.pdf|0.3.3|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/0.3.3|LDBC_SNB_I_20200726_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20200726_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20200726_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20220816_SF30-100-300_tugraph-attachments.tar.gz|4855.52|C++ stored procedures|30|5436.47|280650|USD|AWS r5d.12xlarge, 374GB RAM, 48×Intel Xeon Platinum 8175M vCPUs +2020-07-26|imperative|FMA|https://fma-ai.cn/|TuGraph|1.1|https://fma-ai.cn/|0.3.2|https://arxiv.org/pdf/2001.02299v1.pdf|0.3.3|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/0.3.3|LDBC_SNB_I_20200726_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20200726_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20200726_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20220816_SF30-100-300_tugraph-attachments.tar.gz|4855.52|C++ stored procedures|100|5010.77|280650|USD|AWS r5d.12xlarge, 374GB RAM, 48×Intel Xeon Platinum 8175M vCPUs +2020-07-26|imperative|FMA|https://fma-ai.cn/|TuGraph|1.1|https://fma-ai.cn/|0.3.2|https://arxiv.org/pdf/2001.02299v1.pdf|0.3.3|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/0.3.3|LDBC_SNB_I_20200726_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20200726_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20200726_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20220816_SF30-100-300_tugraph-attachments.tar.gz|4855.52|C++ stored procedures|300|4855.52|280650|USD|AWS r5d.12xlarge, 374GB RAM, 48×Intel Xeon Platinum 8175M vCPUs +2023-01-28|imperative|Ant Group|https://www.antgroup.com/en|TuGraph|3.3.4|https://github.com/tugraph-db/tugraph-db|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230128_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20230128_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20230128_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230128_SF30-100-300_tugraph-attachments.tar.gz|13532.62|C++ stored procedures|30|16133.08|277542|RMB|Alibaba Cloud ecs.g8y.16xlarge, 256GiB RAM, 64×Arm-based YiTian 710 vCPUs +2023-01-28|imperative|Ant Group|https://www.antgroup.com/en|TuGraph|3.3.4|https://github.com/tugraph-db/tugraph-db|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230128_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20230128_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20230128_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230128_SF30-100-300_tugraph-attachments.tar.gz|13532.62|C++ stored procedures|100|16966.26|277542|RMB|Alibaba Cloud ecs.g8y.16xlarge, 256GiB RAM, 64×Arm-based YiTian 710 vCPUs +2023-01-28|imperative|Ant 
Group|https://www.antgroup.com/en|TuGraph|3.3.4|https://github.com/tugraph-db/tugraph-db|0.3.6|https://arxiv.org/pdf/2001.02299v3.pdf|1.2.0|https://github.com/ldbc/ldbc_snb_interactive_v1_driver/releases/tag/v1.2.0|LDBC_SNB_I_20230128_SF30-100-300_tugraph.pdf|LDBC_SNB_I_20230128_SF30-100-300_tugraph-executive_summary.pdf|LDBC_SNB_I_20230128_SF30-100-300_tugraph-signatures.pdf|https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20230128_SF30-100-300_tugraph-attachments.tar.gz|13532.62|C++ stored procedures|300|13532.62|277542|RMB|Alibaba Cloud ecs.g8y.16xlarge, 256GiB RAM, 64×Arm-based YiTian 710 vCPUs diff --git a/developer-community/index.html b/developer-community/index.html new file mode 100644 index 00000000..ffe74715 --- /dev/null +++ b/developer-community/index.html @@ -0,0 +1,353 @@ + + + + + Developer Community + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
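The benchmark result files above (data/snb_bi.csv and data/snb_interactive.csv) are pipe-delimited, with a header row naming every field. A minimal sketch of how such a file could be loaded, assuming only Python's standard csv module and the data/snb_interactive.csv path from this diff (the column names are taken from that file's header row):

```python
import csv

# Minimal sketch: load one of the pipe-delimited result files added above.
# Assumes the script runs from the repository root, where data/snb_interactive.csv lives.
with open("data/snb_interactive.csv", newline="", encoding="utf-8") as f:
    reader = csv.DictReader(f, delimiter="|")
    for row in reader:
        # Each row is one audited run; print system, scale factor, and throughput.
        print(row["date"], row["software_name"],
              "SF" + row["scale_factor"], row["throughput"])
```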
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Developer Community

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

If you are interested in joining our benchmark task forces, please reach out to us at info@ldbcouncil.org.

+

Licensing

+

Our benchmarks are licensed under the Apache Software License, Version 2.0 (license file, notice file).

+

Contributor License Agreement

+

To contribute to the LDBC repositories, we ask you to sign a CLA or become an LDBC member. These options are available for both individuals and organizations.

+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/developer/finbench/index.html b/developer/finbench/index.html new file mode 100644 index 00000000..588fa8b8 --- /dev/null +++ b/developer/finbench/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/benchmarks/finbench/ + + + + + + diff --git a/developer/snb/index.html b/developer/snb/index.html new file mode 100644 index 00000000..722eb105 --- /dev/null +++ b/developer/snb/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/benchmarks/snb/ + + + + + + diff --git a/developer/spb/index.html b/developer/spb/index.html new file mode 100644 index 00000000..b1746b28 --- /dev/null +++ b/developer/spb/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/benchmarks/spb/ + + + + + + diff --git a/docs/LDBC Byelaws.1.5.ADOPTED.2024-01-12.pdf b/docs/LDBC Byelaws.1.5.ADOPTED.2024-01-12.pdf new file mode 100644 index 00000000..dfe92997 Binary files /dev/null and b/docs/LDBC Byelaws.1.5.ADOPTED.2024-01-12.pdf differ diff --git a/docs/LDBC.Articles.of.Association.ADOPTED.2021-01-14.pdf b/docs/LDBC.Articles.of.Association.ADOPTED.2021-01-14.pdf new file mode 100644 index 00000000..cfbc0f83 Binary files /dev/null and b/docs/LDBC.Articles.of.Association.ADOPTED.2021-01-14.pdf differ diff --git a/docs/LDBC.Articles.of.Association.ADOPTED.2023-03-30.pdf b/docs/LDBC.Articles.of.Association.ADOPTED.2023-03-30.pdf new file mode 100644 index 00000000..284c51d2 Binary files /dev/null and b/docs/LDBC.Articles.of.Association.ADOPTED.2023-03-30.pdf differ diff --git a/docs/LDBC.Byelaws.1.1.ADOPTED.2017-03-02.pdf b/docs/LDBC.Byelaws.1.1.ADOPTED.2017-03-02.pdf new file mode 100644 index 00000000..da96ef26 Binary files /dev/null and b/docs/LDBC.Byelaws.1.1.ADOPTED.2017-03-02.pdf differ diff --git a/docs/LDBC.Byelaws.1.2.ADOPTED.2020-07-28.pdf b/docs/LDBC.Byelaws.1.2.ADOPTED.2020-07-28.pdf new file mode 100644 index 00000000..2416cbb1 Binary files /dev/null and b/docs/LDBC.Byelaws.1.2.ADOPTED.2020-07-28.pdf differ diff --git a/docs/LDBC.Byelaws.1.3.ADOPTED.2021-01-14.pdf b/docs/LDBC.Byelaws.1.3.ADOPTED.2021-01-14.pdf new file mode 100644 index 00000000..9800be11 Binary files /dev/null and b/docs/LDBC.Byelaws.1.3.ADOPTED.2021-01-14.pdf differ diff --git a/docs/LDBC.Byelaws.1.4.ADOPTED.2023-05-02.pdf b/docs/LDBC.Byelaws.1.4.ADOPTED.2023-05-02.pdf new file mode 100644 index 00000000..b4e7f658 Binary files /dev/null and b/docs/LDBC.Byelaws.1.4.ADOPTED.2023-05-02.pdf differ diff --git a/docs/LDBC.Byelaws.1.5.ADOPTED.2024-01-12.pdf b/docs/LDBC.Byelaws.1.5.ADOPTED.2024-01-12.pdf new file mode 100644 index 00000000..dfe92997 Binary files /dev/null and b/docs/LDBC.Byelaws.1.5.ADOPTED.2024-01-12.pdf differ diff --git a/docs/LDBC.Individual.Contributor.License.Agreement.Form-2020-10-23.pdf b/docs/LDBC.Individual.Contributor.License.Agreement.Form-2020-10-23.pdf new file mode 100644 index 00000000..7f84e331 Binary files /dev/null and b/docs/LDBC.Individual.Contributor.License.Agreement.Form-2020-10-23.pdf differ diff --git a/docs/LDBC.Membership--Joining.and.Renewing.(August.2023).pdf b/docs/LDBC.Membership--Joining.and.Renewing.(August.2023).pdf new file mode 100644 index 00000000..b826fd39 Binary files /dev/null and b/docs/LDBC.Membership--Joining.and.Renewing.(August.2023).pdf differ diff --git a/docs/LDBC.Membership.-.Joining.and.Renewing.2022.pdf b/docs/LDBC.Membership.-.Joining.and.Renewing.2022.pdf new file mode 100644 index 00000000..7c7b9c28 Binary files /dev/null and 
b/docs/LDBC.Membership.-.Joining.and.Renewing.2022.pdf differ diff --git a/docs/LDBC.Membership.Application.and.Renewal.Form.2021-01-14.pdf b/docs/LDBC.Membership.Application.and.Renewal.Form.2021-01-14.pdf new file mode 100644 index 00000000..aea7ecf4 Binary files /dev/null and b/docs/LDBC.Membership.Application.and.Renewal.Form.2021-01-14.pdf differ diff --git a/docs/LDBC.Membership.Application_Renewal.Form.and.incorporated.Membership.Agreement.(August.2023).pdf b/docs/LDBC.Membership.Application_Renewal.Form.and.incorporated.Membership.Agreement.(August.2023).pdf new file mode 100644 index 00000000..d5dd797c Binary files /dev/null and b/docs/LDBC.Membership.Application_Renewal.Form.and.incorporated.Membership.Agreement.(August.2023).pdf differ diff --git a/docs/LDBC.Organization.Contributor.License.Agreement.Form-2020-10-23.pdf b/docs/LDBC.Organization.Contributor.License.Agreement.Form-2020-10-23.pdf new file mode 100644 index 00000000..253b6776 Binary files /dev/null and b/docs/LDBC.Organization.Contributor.License.Agreement.Form-2020-10-23.pdf differ diff --git a/docs/ldbc-benchmark-specification-process.pdf b/docs/ldbc-benchmark-specification-process.pdf new file mode 100644 index 00000000..1f481928 Binary files /dev/null and b/docs/ldbc-benchmark-specification-process.pdf differ diff --git a/docs/ldbc-snb-auditing-process.pdf b/docs/ldbc-snb-auditing-process.pdf new file mode 100644 index 00000000..b56eaaf6 Binary files /dev/null and b/docs/ldbc-snb-auditing-process.pdf differ diff --git a/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-01--SQL_PGQ-data-model-and-graph-schema.DOI.10.54285_ldbc.QZSK3559.pdf b/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-01--SQL_PGQ-data-model-and-graph-schema.DOI.10.54285_ldbc.QZSK3559.pdf new file mode 100644 index 00000000..324fec17 Binary files /dev/null and b/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-01--SQL_PGQ-data-model-and-graph-schema.DOI.10.54285_ldbc.QZSK3559.pdf differ diff --git a/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-02--Introduction-to-GQL-Schema-design.DOI.10.54285_ldbc.EPWQ6741.pdf b/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-02--Introduction-to-GQL-Schema-design.DOI.10.54285_ldbc.EPWQ6741.pdf new file mode 100644 index 00000000..899cbad5 Binary files /dev/null and b/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-02--Introduction-to-GQL-Schema-design.DOI.10.54285_ldbc.EPWQ6741.pdf differ diff --git a/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-03--Cypher-schema-constraints-proposal.DOI.10.54285_ldbc.KKHM1756.pdf b/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-03--Cypher-schema-constraints-proposal.DOI.10.54285_ldbc.KKHM1756.pdf new file mode 100644 index 00000000..e5a385e4 Binary files /dev/null and b/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-03--Cypher-schema-constraints-proposal.DOI.10.54285_ldbc.KKHM1756.pdf differ diff --git a/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-04--LDBC-Property-Graph-Schema-contributions-to-WG3.DOI.10.54285_ldbc.OFJF3566.pdf b/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-04--LDBC-Property-Graph-Schema-contributions-to-WG3.DOI.10.54285_ldbc.OFJF3566.pdf new file mode 100644 index 00000000..14cb184a Binary files /dev/null and b/docs/papers/LDBC-Open-Access-External-Paper-OAEP-2023-04--LDBC-Property-Graph-Schema-contributions-to-WG3.DOI.10.54285_ldbc.OFJF3566.pdf differ diff --git 
a/docs/papers/LDBC-Technical-Report-TR-2021-01--Property-graphs-and-paths-in-GQL-Mathematical-definitions.DOI.10.54285_ldbc.TZJP7279.pdf b/docs/papers/LDBC-Technical-Report-TR-2021-01--Property-graphs-and-paths-in-GQL-Mathematical-definitions.DOI.10.54285_ldbc.TZJP7279.pdf new file mode 100644 index 00000000..0b499494 Binary files /dev/null and b/docs/papers/LDBC-Technical-Report-TR-2021-01--Property-graphs-and-paths-in-GQL-Mathematical-definitions.DOI.10.54285_ldbc.TZJP7279.pdf differ diff --git a/docs/papers/LDBC-Work-Charter-WC-2022-02--LDBC-Extended-Graph-Schema--LEX--Work-Charter.DOI.10.54285_ldbc.VSBC2149.pdf b/docs/papers/LDBC-Work-Charter-WC-2022-02--LDBC-Extended-Graph-Schema--LEX--Work-Charter.DOI.10.54285_ldbc.VSBC2149.pdf new file mode 100644 index 00000000..eeb23d0d Binary files /dev/null and b/docs/papers/LDBC-Work-Charter-WC-2022-02--LDBC-Extended-Graph-Schema--LEX--Work-Charter.DOI.10.54285_ldbc.VSBC2149.pdf differ diff --git a/docs/papers/LDBC-Work-Charter-WC-2023-01--LDBC-Extended-GQL-Schema--LEX--Work-Charter.1.1.DOI.10.54285_ldbc.SSIF9351.pdf b/docs/papers/LDBC-Work-Charter-WC-2023-01--LDBC-Extended-GQL-Schema--LEX--Work-Charter.1.1.DOI.10.54285_ldbc.SSIF9351.pdf new file mode 100644 index 00000000..d7052b00 Binary files /dev/null and b/docs/papers/LDBC-Work-Charter-WC-2023-01--LDBC-Extended-GQL-Schema--LEX--Work-Charter.1.1.DOI.10.54285_ldbc.SSIF9351.pdf differ diff --git a/docs/papers/LDBC-Work-Charter-WC-2023-03--LDBC-GQL-Implementation-Work-Charter.1.1.DOI.10.54285_ldbc.RQON8307.pdf b/docs/papers/LDBC-Work-Charter-WC-2023-03--LDBC-GQL-Implementation-Work-Charter.1.1.DOI.10.54285_ldbc.RQON8307.pdf new file mode 100644 index 00000000..9d14c247 Binary files /dev/null and b/docs/papers/LDBC-Work-Charter-WC-2023-03--LDBC-GQL-Implementation-Work-Charter.1.1.DOI.10.54285_ldbc.RQON8307.pdf differ diff --git a/docs/papers/datagen-deletes-grades-nda-2020.pdf b/docs/papers/datagen-deletes-grades-nda-2020.pdf new file mode 100644 index 00000000..1900a604 Binary files /dev/null and b/docs/papers/datagen-deletes-grades-nda-2020.pdf differ diff --git a/docs/papers/ldbc-acid-tpctc2020.pdf b/docs/papers/ldbc-acid-tpctc2020.pdf new file mode 100644 index 00000000..19044a2b Binary files /dev/null and b/docs/papers/ldbc-acid-tpctc2020.pdf differ diff --git a/docs/papers/ldbc-organization-tpctc2023-preprint.pdf b/docs/papers/ldbc-organization-tpctc2023-preprint.pdf new file mode 100644 index 00000000..f4e61661 Binary files /dev/null and b/docs/papers/ldbc-organization-tpctc2023-preprint.pdf differ diff --git a/docs/papers/ldbc-snb-bi-grades-nda-2018.pdf b/docs/papers/ldbc-snb-bi-grades-nda-2018.pdf new file mode 100644 index 00000000..272aad49 Binary files /dev/null and b/docs/papers/ldbc-snb-bi-grades-nda-2018.pdf differ diff --git a/docs/papers/ldbc-snb-bi-vldb-2022.pdf b/docs/papers/ldbc-snb-bi-vldb-2022.pdf new file mode 100644 index 00000000..cd354e6c Binary files /dev/null and b/docs/papers/ldbc-snb-bi-vldb-2022.pdf differ diff --git a/docs/papers/ldbc-snb-bi-vldb-2023.pdf b/docs/papers/ldbc-snb-bi-vldb-2023.pdf new file mode 100644 index 00000000..cd354e6c Binary files /dev/null and b/docs/papers/ldbc-snb-bi-vldb-2023.pdf differ diff --git a/docs/papers/ldbc-snb-interactive-sigmod-2015.pdf b/docs/papers/ldbc-snb-interactive-sigmod-2015.pdf new file mode 100644 index 00000000..bf76ed84 Binary files /dev/null and b/docs/papers/ldbc-snb-interactive-sigmod-2015.pdf differ diff --git a/docs/papers/ldbc-snb-interactive-v2-tpctc2023-preprint.pdf 
b/docs/papers/ldbc-snb-interactive-v2-tpctc2023-preprint.pdf new file mode 100644 index 00000000..533f885d Binary files /dev/null and b/docs/papers/ldbc-snb-interactive-v2-tpctc2023-preprint.pdf differ diff --git a/docs/papers/msc-thesis-david-puroja-snb-interactive-v2-2023.pdf b/docs/papers/msc-thesis-david-puroja-snb-interactive-v2-2023.pdf new file mode 100644 index 00000000..ead0d1e7 Binary files /dev/null and b/docs/papers/msc-thesis-david-puroja-snb-interactive-v2-2023.pdf differ diff --git a/docs/papers/parameter-curation-tpctc2014.pdf b/docs/papers/parameter-curation-tpctc2014.pdf new file mode 100644 index 00000000..6d58915f Binary files /dev/null and b/docs/papers/parameter-curation-tpctc2014.pdf differ diff --git a/docs/papers/s3g2-scalable-data-generator-tpctc2012.pdf b/docs/papers/s3g2-scalable-data-generator-tpctc2012.pdf new file mode 100644 index 00000000..e9b1578a Binary files /dev/null and b/docs/papers/s3g2-scalable-data-generator-tpctc2012.pdf differ diff --git a/docs/papers/tpc-h-analyzed-choke-points-tpctc2013.pdf b/docs/papers/tpc-h-analyzed-choke-points-tpctc2013.pdf new file mode 100644 index 00000000..69eb527e Binary files /dev/null and b/docs/papers/tpc-h-analyzed-choke-points-tpctc2013.pdf differ diff --git a/docs/papers/w16045-prepub-LDBC-Technical-Report-TR-2021-01--Property-graphs-and-paths-in-GQL-Mathematical-definitions.pdf b/docs/papers/w16045-prepub-LDBC-Technical-Report-TR-2021-01--Property-graphs-and-paths-in-GQL-Mathematical-definitions.pdf new file mode 100644 index 00000000..77854124 Binary files /dev/null and b/docs/papers/w16045-prepub-LDBC-Technical-Report-TR-2021-01--Property-graphs-and-paths-in-GQL-Mathematical-definitions.pdf differ diff --git a/docs/presentations/graph-databases-2021-11.pdf b/docs/presentations/graph-databases-2021-11.pdf new file mode 100644 index 00000000..eac7b460 Binary files /dev/null and b/docs/presentations/graph-databases-2021-11.pdf differ diff --git a/docs/presentations/ldbc-snb-2021-12.pdf b/docs/presentations/ldbc-snb-2021-12.pdf new file mode 100644 index 00000000..9cbc43e5 Binary files /dev/null and b/docs/presentations/ldbc-snb-2021-12.pdf differ diff --git a/docs/presentations/ldbc-snb-2022-11.pdf b/docs/presentations/ldbc-snb-2022-11.pdf new file mode 100644 index 00000000..9aec9e54 Binary files /dev/null and b/docs/presentations/ldbc-snb-2022-11.pdf differ diff --git a/docs/presentations/tpctc-2023-ldbc-linked-data-benchmark-council-organization.pdf b/docs/presentations/tpctc-2023-ldbc-linked-data-benchmark-council-organization.pdf new file mode 100644 index 00000000..d7e2c872 Binary files /dev/null and b/docs/presentations/tpctc-2023-ldbc-linked-data-benchmark-council-organization.pdf differ diff --git a/docs/presentations/tpctc-2023-ldbc-snb-interactive-v2.pdf b/docs/presentations/tpctc-2023-ldbc-snb-interactive-v2.pdf new file mode 100644 index 00000000..7a1d7d5e Binary files /dev/null and b/docs/presentations/tpctc-2023-ldbc-snb-interactive-v2.pdf differ diff --git a/docs/presentations/vldb-2023-ldbc-snb-bi-slides-szarnyasg.pdf b/docs/presentations/vldb-2023-ldbc-snb-bi-slides-szarnyasg.pdf new file mode 100644 index 00000000..bd45750d Binary files /dev/null and b/docs/presentations/vldb-2023-ldbc-snb-bi-slides-szarnyasg.pdf differ diff --git a/docs/tuc17th/duckpgq.pdf b/docs/tuc17th/duckpgq.pdf new file mode 100644 index 00000000..fce8d914 Binary files /dev/null and b/docs/tuc17th/duckpgq.pdf differ diff --git a/event/eighteenth-tuc-meeting/index.html b/event/eighteenth-tuc-meeting/index.html new file 
mode 100644 index 00000000..bb61b45e --- /dev/null +++ b/event/eighteenth-tuc-meeting/index.html @@ -0,0 +1,476 @@ + + + + + Eighteenth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Eighteenth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Shipeng Qi / on 24 Apr 2024
+ + + +
+ Location: Guangzhou +
+
+ + Event dates: 30 Aug 2024 09:00 -- 31 Aug 2024 18:00 (local timezone) + +
+
+

Organizers: Shipeng Qi (Ant Group), Wenyuan Yu (Alibaba DAMO Academy), Yan Zhou (CreateLink)

+

LDBC is hosting a two-day hybrid workshop, co-located in Guangzhou with VLDB 2024 on August 30-31 (Friday-Saturday).

+

The program consists of 10- and 15-minute talks followed by a Q&A session. The talks will be recorded and made available online. If you would like to participate, please register using our form.

+

Program

+

All times are in CST (UTC+8, Guangzhou local time).

+

August 30, Friday

+

Location: Langham Place, Guangzhou, room 1,
+co-located with VLDB (No. 630-638 Xingang Dong Road, Haizhu District, Guangzhou, China). See the map here.

+

Agenda: TBA

+

August 31, Saturday

+

Location: Alibaba Center, Guangzhou (No. 88 Dingxin Road, Haizhu District, Guangzhou, China), near the VLDB venue (Langham Place). See the map here.

+

Agenda: TBA

+

TUC event locations

+

A map of the LDBC TUC events we have hosted so far.

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/eighth-tuc-meeting/index.html b/event/eighth-tuc-meeting/index.html new file mode 100644 index 00000000..8687a053 --- /dev/null +++ b/event/eighth-tuc-meeting/index.html @@ -0,0 +1,582 @@ + + + + + Eighth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Eighth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Damaris Coll / on 22 Jun 2016
+ + + +
+ Location: Oracle Conference Center in Redwood Shores (CA) US +
+
+ + Event dates: 22 Jun 2016 14:45 -- 23 Jun 2016 14:45 (local timezone) + +
+
+

The LDBC consortium is pleased to announce its Eighth Technical User Community (TUC) meeting.

+

This will be a two-day event at the Oracle Conference Center in Redwood Shores on Wednesday and Thursday, June 22-23, 2016.

+

This will be the second TUC meeting after the finalisation of the LDBC FP7 EC-funded project. The event will cover the following aspects:

+
    +
  • A two-day event, with one day devoted to users’ experiences and one day devoted to benchmarking experiences.
  • +
  • Presentation of the benchmarking results for the different benchmarks.
  • +
  • Interaction with the new LDBC Board of Directors and the LDBC organisation officials.
  • +
+

We welcome all users of RDF and graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at damaris@ac.upc.edu; in order to notify Oracle security in advance, registration requests need to be in by June 12.

+

In the agenda, there will be talks by LDBC members on LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and in hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmarks (or benchmark proposals) are very relevant, but nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.

+

Further, if you or your colleagues happen to have contacts at companies that deal with graph data management scenarios, we encourage you to invite them to attend and possibly present. LDBC is always looking to expand its circle of TUC meeting participants and its contacts among graph technology users, and eventually its membership base.

+

On this page, you’ll find information about the following items:

+ +

Agenda

+

On Wednesday, lunch is provided for all attendees at 12:00 pm. The TUC meeting will start at 1:00 pm.

+
Wednesday, 22nd of June 2016 (Room 203)
+

(full morning: LDBC Board of Directors meeting)

+ +
Thursday, 23rd of June 2016 (Room 203)
+ +
Friday, 24th of June 2016 (Room 105)
+

At the same venue: the fourth international workshop on Graph Data-management Experiences and Systems (GRADES16).

+

18:30 social dinner for GRADES registrants (place to be announced)

+

Logistics

+
Date
+

22nd and 23rd June 2016

+
Venue
+

The TUC meeting will be held at the Oracle Conference Center.

+

The address is:

+

Room 203 (Wed-Thu) & Room 105 (Fri)
+Oracle Conference Center
+350 Oracle Parkway
+Redwood City, CA 94065, USA

+

Maps and location

+

Google Maps link

+

Oracle Campus map:

+

+
Getting there
+
Driving directions
+
    +
  • [Southbound] - Take Highway 101 South (toward San Jose) to the Ralston Ave./Marine World Parkway exit. Take Marine World Parkway east which will loop you back over the freeway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.
  • +
  • [Northbound] - Take Highway 101 North (toward San Francisco) to the Ralston Ave./Marine World Parkway exit. Take the first exit ramp onto Marine World Parkway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.
  • +
+
Parking
+

The Conference Center has a designated parking lot directly across from the building. If the lot is full, there is additional parking in the parking garages located nearby. No parking permits are needed.

+
Public transport
+

Take the Caltrain to either San Carlos or Hillsdale and take the free Oracle shuttle from there. Get off the Oracle shuttle at 100 Oracle Parkway (second stop) and walk 5 minutes to get to the Conference Center.

+ +

You can also take the Caltrain to Belmont and walk about 23 minutes instead of taking the Oracle shuttle.

+

Alternatively, SamTrans (San Mateo County’s Transit Agency) provides public bus service between the Millbrae BART station and Palo Alto with three stops on Oracle Parkway - one of which is directly in front of the Oracle Conference Center.

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/eleventh-tuc-meeting/index.html b/event/eleventh-tuc-meeting/index.html new file mode 100644 index 00000000..9d811ea3 --- /dev/null +++ b/event/eleventh-tuc-meeting/index.html @@ -0,0 +1,534 @@ + + + + + Eleventh TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Eleventh TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Peter Boncz / on 08 Jun 2018
+ + + +
+ Location: Austin, TX +
+
+ + Event date: 08 Jun 2018 08:30 (local timezone) + +
+
+

LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmark development, (2) give feedback on these, (3) hear about user experiences with graph data management technologies, and (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, and Huawei among its members.

+

This TUC meeting will be a one-day event preceding the SIGMOD/PODS 2018 conference, which takes place in Houston, Texas (not too far away) during the whole following week. Note also that SIGMOD/PODS in Houston hosts GRADES-NDA 2018, a research workshop on graph data management technology, on Sunday June 10, so you might combine travel.

+

We welcome all users of RDF and graph technologies to attend. If you are interested in attending the event, please contact Damaris Coll (UPC) at damaris@ac.upc.edu to register.

+

=> registration is free, but required <=

+

In the agenda, there will be talks by LDBC members on LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and in hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmarks (or benchmark proposals) are very relevant, but nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz (boncz@cwi.nl) and Larri (larri@ac.upc.edu). The local organizer is Juan Sequeda (juanfederico@gmail.com).

+

Further, if you or your colleagues happen to have contacts at companies that deal with graph data management scenarios, we encourage you to invite them to attend and possibly present. LDBC is always looking to expand its circle of TUC meeting participants and its contacts among graph technology users, and eventually its membership base.

+

Agenda

+

In the TUC meeting there will be:

+
    +
  • updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its interactive, business analytics and graphalytics workloads.
  • +
  • talks by data management practitioners highlighting graph data management challenges and products
  • +
+

The meeting will start on Friday morning, with a program from 10:30-17:00:

+ +

Location

+

The TUC will be held at the University of Texas at Austin, Department of Computer Science, in the Gates Dell Complex (GDC), 2317 Speedway, Austin, TX 78712. Room: GDC 6.302.

+

The GDC has a North and a South building. GDC 6.302 is in the North building. When you enter the main entrance, the North building is on the left and it is served by a pair of elevators. You can take either elevator to the 6th floor. Exit the elevator on the 6th floor, then turn left, right, left.

+

From Austin to SIGMOD/PODS (Houston) on Saturday June 9

+

Many of the attendees will be going to SIGMOD/PODS, which will be held in Houston.

+

Bus

+

One option is to take a MegaBus that departs from downtown Austin and arrives in downtown Houston.

+

There is a bus that departs at 12:00 pm and arrives at 3:00 pm. The cost is $20 (as of April 23).

+

If you want to spend the day in Austin, there is a bus that departs at 9:55 pm and arrives at 12:50 am. The cost is $5 (as of April 23).

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/fifteenth-tuc-meeting/index.html b/event/fifteenth-tuc-meeting/index.html new file mode 100644 index 00000000..173c0c5e --- /dev/null +++ b/event/fifteenth-tuc-meeting/index.html @@ -0,0 +1,667 @@ + + + + + Fifteenth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Fifteenth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Gábor Szárnyas / on 05 Apr 2022
+ + + +
+ Location: Philadelphia, Marriott Philadelphia Downtown +
+
+ + Event dates: 17 Jun 2022 09:20 -- 18 Jun 2022 15:30 (local timezone) + +
+
+

Organizers: Gábor Szárnyas, Jack Waudby, Peter Boncz, Alastair Green

+

LDBC is hosting a two-day hybrid workshop, co-located with SIGMOD 2022 on June 17-18 (Friday-Saturday).

+

The program consists of 10-15 minute talks followed by a Q&A session. The talks will be recorded and made available online.
+The tentative program is the following. All times are in EDT.

+

We will have a social event on Friday at 17:30 at El Vez (Google Maps).

+

Friday (Pennsylvania Convention Center, room 204B)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
startfinishspeakertitle
09:2009:30Peter Boncz (LDBC/CWI)State of the union – slides, video
09:3009:45Alastair Green (LDBC/Birkbeck)LDBC’s fair use policies – slides, video
09:5010:05Gábor Szárnyas (LDBC/CWI), Jack Waudby (Newcastle University)LDBC Social Network Benchmark: Business Intelligence workload v1.0 – slides, video
10:1010:25Heng Lin (Ant Group)LDBC Financial Benchmark introduction – slides, video
10:3011:00coffee break
11:0011:15Chen Zhang (CreateLink)New LDBC SNB benchmark record by Galaxybase: More than 6 times faster and 70% higher throughput – slides, video
11:2011:35James Clarkson (Neo4j)LDBC benchmarks: Promoting good science and industrial consumption – slides, video
11:4011:55Oskar van Rest (Oracle)Creating and querying property graphs in Oracle, on-premise and in the cloud – slides, video
12:0012:15Mingxi Wu (TigerGraph)Conquering LDBC SNB BI at SF-10k – slides, video
12:2013:20lunch (on your own)
13:2013:35Altan Birler (Technische Universität München)Relational databases can handle graphs too! Experiences with optimizing the Umbra RDBMS for LDBC SNB BI – slides, video
13:4013:55David Püroja (CWI)LDBC Social Network Benchmark: Interactive workload v2.0 – slides
14:0014:15Angela Bonifati (Lyon 1 University)The quest for schemas in graph databases – slides, video
14:2014:35Matteo Lissandrini (Aalborg University)Understanding graph data representations in triplestores – slides, video
14:4014:55Wim Martens (University of Bayreuth)Path representations – slides, video
15:0015:20Audrey Cheng (UC Berkeley)TAOBench: An end-to-end benchmark for social network workloads – slides, video
+

Saturday (Philadelphia Marriott Downtown, room 401-402, 4th floor)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
startfinishspeakertitle
10:0010:15Keith Hare (WG3)An update on the GQL & SQL/PGQ standards efforts – slides, video
10:2010:35Leonid Libkin (ENS Paris)Pattern matching in GQL and SQL/PGQ – slides, video
10:4010:55Petra Selmer (Neo4j/WG3)An overview of GQL – slides, video
11:0011:15Alastair Green (LDBC/WG3)GQL 2.0: A technical manifesto – slides, video
11:2011:35George Fletcher (TU Eindhoven)PG-Keys (LDBC Property Graph Schema Working Group) – slides, video
11:4011:55Arvind Shyamsundar (Microsoft)Graph capabilities in Microsoft SQL Server and Azure SQL Database – slides, video
12:0013:30lunch (on your own)
13:3013:45Daniël ten Wolde (CWI)Implementing SQL/PGQ in DuckDB – slides, video
13:5014:05Oszkár Semeráth, Kristóf Marussy (TU Budapest)Generation techniques for consistent, realistic, diverse, and scalable graphs – slides, video
14:1014:25Molham Aref (RelationalAI)Graph Normal Form – slides, video
14:3014:45Naomi Arnold (Queen Mary University of London)Temporal graph analysis of the far-right social network Gab – slides, video
14:5015:05Domagoj Vrgoč (PUC Chile)Evaluating path queries in MillenniumDB – slides, video
15:1015:25Pavel Klinov, Evren Sirin (Stardog)Stardog’s experience with LDBC – slides, video
+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/fifth-tuc-meeting/index.html b/event/fifth-tuc-meeting/index.html new file mode 100644 index 00000000..0ee34f1e --- /dev/null +++ b/event/fifth-tuc-meeting/index.html @@ -0,0 +1,498 @@ + + + + + Fifth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Fifth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Irini Fundulaki / on 14 Nov 2014
+ + + +
+ Location: Athens, Greece +
+
+ + Event date: 14 Nov 2014 12:32 (local timezone) + +
+
+

The LDBC consortium is pleased to announce its fifth Technical User
+Community (TUC) meeting.

+

This will be a one-day event at the National Hellenic Research Foundation
+in Athens, Greece, on Friday, November 14, 2014.

+

Agenda

+

10:30 - 11:00 Coffee Break

+

11:00 - 11:10 Peter Boncz (VUA) Welcome & LDBC project status update (Presentation)

+

11:10 - 11:25 Venelin Kotsev (ONTO) Semantic Publishing Benchmark: Short Presentation of SPB and Status

+

Feedback & Roadmap for SPB & OWLIM (Presentation)

+

11:25 - 11:30 Orri Erling (OGL) Status, Feedback & Roadmap for SPB & Virtuoso (Presentation)

+

11:30 - 11:45 Alex Averbuch (NEO) Social Network Benchmark: Short Presentation of SNB and Status, Feedback & Roadmap for SNB & Neo4J (Presentation)

+

11:45 - 12:00 Orri Erling (OGL) Status, Feedback & Roadmap for SNB & Virtuoso (Presentation)

+

12:00 - 12:20 Arnau Prat (UPC) & Andrey Gubichev Status, Feedback & Roadmap for SNB Interactive & Sparksee (Presentation) and Business Intelligence (Presentation)

+

12:20 - 12:40 Tomer Sagi, “Experience with SNB and TitanDB at HP” (Presentation)

+

12:40 - 13:00 Jakob Nelson, “graphbench.org on the SNB datagen”

+

13:00 - 14:30 Lunch Break @ Byzantine & Christian Museum (link)

+

14:30 - 14:50 Olaf Hartig, “Integrating the Property Graph and RDF data models” (Presentation)

+

Documents: arxiv/1409.3288, arxiv/1406.3399

+

14:50 - 15:10 Maria-Esther Vidal and Maribel Acosta, “Challenges to be addressed during Benchmarking SPARQL Federated Engines” (Presentation)

+

15:10 - 15:30 Evaggelia Pitoura, “Historical Queries on Graphs” (Presentation)

+

15:30 - 16:00 Coffee Break

+

16:00 - 16:20 Manolis Terrovitis, Giannis Liagos, George Papastefanatos, “Efficient Identification of Implicit Facts in Incomplete OWL2-EL Knowledge Bases” (Presentation)

+

16:20 - 16:40 Gunes Aluc, “WatDiv: How to Tune-up your RDF Data Management System” (Presentation)

+

16:40 - 17:00 Giorgos Kollias, Yannis Smaragdakis, “Benchmarking @LogicBlox” (Presentation)

+

17:00 - 17:15 Hassan Chafi, “Oracle Labs Graph Strategy”

+

17:15 - 17:25 Yinglong Xia, “Property Graphs for Industry Solution at IBM” (Presentation)

+

17:25 - 17:30 Arthur Keen, “Short Introduction to SPARQLcity”

+

20:30 Dinner @ Konservokouti (link)

+

Get a taxi and go to Ippokratous 148, Athens, Neapoli Exarheion.

+

Logistics

+

The meeting will be held at the National Hellenic Research Foundation located in downtown Athens.

+

+

Travel

+

Athens, Greece’s capital city, is easily accessible by air. Travelers on flights to Athens will land at Athens Eleftherios Venizelos International Airport.

+

To reach the city center, you can take the metro from the airport (Line 3) and get off at either the Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or the Syntagma (ΣΥΝΤΑΓΜΑ) station. You can also take the express bus X95 and again get off at either Evangelismos or Syntagma (the latter is the terminus for the bus).

+

You can also take a taxi from the airport, which charges a fixed price to the city center (45 euros). More information on how to get around Athens from the airport can be found here: http://www.aia.gr/traveler/

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/first-tuc-meeting/index.html b/event/first-tuc-meeting/index.html new file mode 100644 index 00000000..a40a0691 --- /dev/null +++ b/event/first-tuc-meeting/index.html @@ -0,0 +1,553 @@ + + + + + First TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

First TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Barry Bishop / on 22 Nov 2012
+ + + +
+ Location: Barcelona, Spain +
+
+ + Event dates: 19 Nov 2012 09:00 -- 20 Nov 2012 17:00 (local timezone) + +
+
+

The LDBC consortium is pleased to announce the first Technical User Community (TUC) meeting. This will be a two-day event in Barcelona on 19–20 November 2012.

+

So far, more than six commercial consumers of graph/RDF database technology have expressed an interest in attending the event, and more are welcome. The proposed format of the event will include:

+
    +
  • Introduction by the coordinator and technical director explaining the objectives of the LDBC project
  • +
  • Invitation to users to explain their use-cases and describe the limitations they have found in current technology
  • +
  • Brainstorming session for identifying trends and mapping out strategies to tackle existing choke-points
  • +
+

The exact agenda will be published here as things get finalised before the event.

+

All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu

+ +

Agenda

+

We will start at 9:00 on Monday for a full day, followed by half a day on Tuesday to allow attendees to travel home on the evening of the 20th.

+

Day 1

+

09:00 Welcome (Location: Aula Master)
+09:30 Project overview (Emphasis on task forces?) + Questionnaire results?
+10:30 Coffee break
+11:00 User talks (To gather information for use cases?)

+

13:00 Lunch

+

14:00 User talks (cont.)
+15:00 Use case discussions (based on questionnaire results + consortium proposal + user talks).
+16:00 Task force proposals (consortium)
+17:00 Finish first day

+

20:00 Social dinner

+

Day 2

+

10:00 Task force discussion (consortium + TUC)
+11:00 Coffee break
+11:30 Task force discussion (consortium + TUC)
+12:30 Summaries (Task forces, use cases, …) and actions

+

13:00 Lunch and farewell

+

15:00 LDBC Internal meeting

+

Slides

+

Opening session:

+ +

User stories:

+ +

Benchmark proposals:

+ +

Logistics

+
Date
+

19th and 20th November 2012

+
Location
+

The TUC meeting will be held in the “Aula Master” in the A3 building, located inside the “Campus Nord de la UPC” in Barcelona. The address is:

+

Aula Master
+Edifici A3, Campus Nord UPC
+C. Jordi Girona, 1-3
+08034 Barcelona, Spain

+

Venue

+

To reach the campus, there are several options, including taxi, metro, and bus.

+

+

Finding UPC

+

+

Finding the meeting room

+

Getting there

+

Flying: Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is the train; its station is just a few minutes’ walk past the parking lots outside terminal 2 (there is a free bus between terminal 1 and terminal 2, see this map of the airport). It is possible to buy a pack of 10 train tickets, which makes the trip cheaper. Taking the bus to the centre of town is more convenient, as buses leave directly from terminals 1 and 2; however, it is more expensive than the train.

+

Rail: The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.

+

Bus: The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.

+

Taxi: From the airport, you can take one of Barcelona’s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €16 and trips to other destinations in the city cost approximately €18.

+

Train and bus: Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. You can find detailed information at the following link: http://www.barcelona-airport.com/eng/transport_eng.htm

+

+

The locations of the airport and the city centre

+

+

Bus map

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/fourteenth-tuc-meeting/index.html b/event/fourteenth-tuc-meeting/index.html new file mode 100644 index 00000000..5b729ce8 --- /dev/null +++ b/event/fourteenth-tuc-meeting/index.html @@ -0,0 +1,598 @@ + + + + + Fourteenth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Fourteenth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Gábor Szárnyas / on 17 Jun 2021
+ + + +
+ Location: Copenhagen, Tivoli Hotel, room Akvariet 2 +
+
+ + Event dates: 16 Aug 2021 16:00 -- 16 Aug 2021 20:00 (local timezone) + +
+
+

LDBC hosted a one-day hybrid workshop, co-located with VLDB 2021, on August 16 (Monday) between 16:00–20:00 CEST.

+

The physical part of the workshop was held in room Akvariet 2 of the Tivoli Hotel (Copenhagen), while the virtual part was hosted on Zoom. Our programme consisted of talks that provided an overview of LDBC’s recent efforts. Moreover, we invited industry practitioners and academic researchers to present their latest results.

+

Talks were scheduled to be 10 minutes with a short Q&A session. We had three sessions. Their schedules are shown below.

+

[16:00–17:25 CEST] LDBC updates, benchmarks, query languages

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
startspeakertitle
16:00Peter Boncz (CWI)State of the union – slides
16:05Gábor Szárnyas (CWI)Overview of LDBC benchmarks – slides
16:12Mingxi Wu (TigerGraph)LDBC Social Network Benchmark results with TigerGraph – slides
16:24Xiaowei Zhu (Ant Group)Financial Benchmark proposal – slides
16:36Petra Selmer (Neo4j)Status report from the Existing Languages Working Group (ELWG) – slides, video
16:48Jan Hidders (Birkbeck)Status report from the Property Graph Schema Working Group (PGSWG) – slides, video
17:00Keith Hare (JCC Consulting)Database Language Standards Structure and Process, SQL/PGQ – slides, video
17:12Stefan Plantikow (GQL Editor)Report on the GQL standard – slides, video
+

coffee break (10 minutes)

+

[17:35–18:45 CEST] Systems and data structures

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
startspeakertitle
17:35Vasileios Trigonakis (Oracle Labs)PGX.D aDFS: An Almost Depth-First-Search Distributed Graph-Querying System – slides, video
17:47Matthias Hauck (SAP)JSON, Spatial, Graph – Multi-model Workloads with SAP HANA Cloud – slides, video
17:59Nikolay Yakovets (Eindhoven University of Technology)AvantGraph – slides, video
18:11Semih Salihoglu (University of Waterloo)GRainDB: Making RDBMSs Efficient on Graph Workloads Through Predefined Joins – slides, video
18:23Semyon Grigorev (Saint Petersburg University)Context-free path querying: Obstacles on the way to adoption – slides, video
18:35Per Fuchs (Technical University of Munich)Sortledton: A universal, transactional graph data structure – slides, video
+

coffee break (10 minutes)

+

[18:55-20:00 CEST] High-level approaches and benchmarks

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
startspeakertitle
18:55Angelos-Christos Anadiotis (Ecole Polytechnique and Institut Polytechnique de Paris)Empowering Investigative Journalism with Graph-based Heterogeneous Data Management – slides, video
19:07Vasia Kalavri (Boston University)Learning to partition unbounded graph streams – slides, video
19:19Muhammad Attahir Jibril (TU Ilmenau)Towards a Hybrid OLTP-OLAP Graph Benchmark – slides, video
19:31Riccardo Tommasini (University of Tartu)An outlook on Benchmarks for Graph Stream Processing – slides, video
19:43Mohamed Ragab (University of Tartu)Benchranking: Towards prescriptive analysis of big graph processing: the case of SparkSQL – slides, video
+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/fourth-tuc-meeting/index.html b/event/fourth-tuc-meeting/index.html new file mode 100644 index 00000000..d42ad0f8 --- /dev/null +++ b/event/fourth-tuc-meeting/index.html @@ -0,0 +1,565 @@ + + + + + Fourth TUC meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Fourth TUC meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Peter Boncz / on 03 Apr 2014
+ + + +
+ Location: Amsterdam, netherlands +
+
+ + Event date: 03 Apr 2014 12:32 (local timezone) + +
+
+

The LDBC consortium is pleased to announce the fourth Technical User Community (TUC) meeting.

+

This will be a one-day event at CWI in Amsterdam on Thursday April 3, 2014.

+

The event will include:

+
    +
  • Introduction to the objectives and progress of the LDBC project.
  • +
  • Description of the progress of the benchmarks being evolved through Task Forces.
  • +
  • Users explaining their use-cases and describing the limitations they have found in current technology.
  • +
  • Industry discussions on the contents of the benchmarks.
  • +
+

All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu

+

For presenters: please limit your talks to just 15 minutes.

+

Agenda

+

April 3rd

+
    +
  • +

    10:00 Peter Boncz (VUA) – pptx, video: LDBC project status update

    +
  • +
  • +

    10:20 Norbert Martinez (UPC) – pdf, video: Status update on the LDBC Social Network Benchmark (SNB) task force.

    +
  • +
  • +

    10:50 Alexandru Iosup (TU Delft) – ppt, video: Towards Benchmarking Graph-Processing Platforms

    +
  • +
  • +

    11:10 Mike Bryant (Kings College) – pptx, video: EHRI Project: Archival Integration with Neo4j

    +
  • +
+

11:30 coffee

+
    +
  • +

    11:50 Thilo Muth (University of Magdeburg) – pptx, video: MetaProteomeAnalyzer: a graph database backed software for functional and taxonomic protein data analysis

    +
  • +
  • +

    12:10 Davy Suvee (Janssen Pharmaceutica / Johnson & Johnson) – video: Euretos Brain - Experiences on using a graph database to analyse data stored as a scientific knowledge graph

    +
  • +
  • +

    12:30 Yongming Luo (TU Eindhoven) – pdf, video: Regularities and dynamics in bisimulation reductions of big graphs

    +
  • +
  • +

    12:50 Christopher Davis (TU Delft) – pdf, video: Enipedia - Enipedia is an active exploration into the applications of wikis and the semantic web for energy and industry issues

    +
  • +
+

13:10 - 14:30 lunch @ restaurant Polder

+
    +
  • +

    14:30 SPB task force report

    +
  • +
  • +

    15:00 Bastiaan Bijl (Sysunite) – pdf, video: Using a semantic approach for monitoring applications in large engineering projects

    +
  • +
  • +

    15:20 Frans Knibbe (Geodan) – pptx, video: Benchmarks for geographical data

    +
  • +
  • +

    15:40 Armando Stellato (University of Rome, Tor Vergata & UN Food and Agriculture Organization) – pptx, video: VocBench2.0, a Collaborative Environment for SKOS/SKOS-XL Management: scalability and (inter)operability challenges

    +
  • +
+

16:00 coffee

+
    +
  • +

    16:20 Ralph Hodgson (TopQuadrant) – [pdf](https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506367.pdf), video: Customer experiences in implementing SKOS-based vocabulary management systems

    +
  • +
  • +

    16:40 Simon Jupp (European Bioinformatics Institute) – pdf, video: Delivering RDF for the life sciences at the European Bioinformatics Institute: Six months in.

    +
  • +
  • +

    17:00 Jerven Bolleman (Swiss Institute of Bioinformatics) – pdf, video: Breakmarking UniProt RDF. SPARQL queries that make your database cry…

    +
  • +
  • +

    17:20 Rein van ’t Veer (Digital Heritage Netherlands) – pptx, video: Time and space for heritage

    +
  • +
  • +

    17:40 end of meeting

    +
  • +
  • +

    19:00 - 21:30 Social Dinner in restaurant Boom

    +
  • +
+

April 4th

+

LDBC plenary meeting for project partners.

+ +

Logistics

+

The meeting will be held at the Dutch national research institute for computer science and mathematics (CWI - Centrum voor Wiskunde en Informatica). It is located at Amsterdam Science Park:

+

+

(A5 map)

+
Travel
+

Arriving & departing:

+

Amsterdam is served by the nearby Schiphol airport (AMS, www.schiphol.nl), which hosts all major European carriers as well as many low-fare carriers.

+

http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane

+

Trains (~5 per hour) are the most convenient means of transport between Schiphol airport and Amsterdam city center (Centraal Station); the ride takes about 17 minutes. Centraal Station is also where you are likely to arrive if you come by international train.

+

From Centraal Station, there is a direct train (every half hour, an 11-minute ride) to Science Park station, which is within walking distance of CWI. If you go from Centraal Station to one of the hotels, take tram 9, which starts at Centraal Station (exception: for Hotel Casa 400, take the metro to Amstel station – any of the metros will do).

+

A taxi is an alternative, though expensive: the fare from Schiphol to CWI or another point in the city center is around 45 EUR (the ride takes 20–30 minutes, depending on traffic).

+

Public transportation (tram, bus, metro) tickets for a single ride and 1-day (24 hour) passes can be purchased from the driver/conductor on trams and buses (cash only) and from vending machines in the metro stations.

+

As a visitor, you will only need the “disposable” cards.

+

Multi-day passes (up to 7 days/168 hours) can only be purchased from the vending machines or from the ticket office opposite Centraal Station.

+

Getting Around: the fastest way to get around Amsterdam is generally by bicycle; consider renting one at your hotel. To get from your hotel to CWI, you can take a taxi (expensive), walk (about 35 minutes), use public transportation (for NH Tropen/The Manor, take bus 40 from Muiderpoort Station; for Hotel Casa 400, the same bus 40 but from Amstel station; for the Rembrandt Hotel, tram 9 to Middenweg/Kruislaan and then bus 40), or simply bike for 12 minutes.

+

Cars

+

If you plan to arrive by car, please be aware that parking space in Amsterdam is scarce and therefore very expensive. However, you can park your car on the “WCW” grounds where CWI is located. To enter the grounds by car, take a ticket from the machine at the gate; to leave, pick up an exit ticket from the CWI reception.

+

Arriving at CWI: once you arrive at CWI, report to the reception and tell them that you are attending the LDBC TUC meeting. You will then receive a visitor’s pass that allows you to enter the building.

+

Social Dinner

+

The social dinner will take place at 7pm on April 3 in Restaurant Boom (boometenendrinken.nl), Linneausstraat 63, Amsterdam.

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/index.html b/event/index.html new file mode 100644 index 00000000..e51d0710 --- /dev/null +++ b/event/index.html @@ -0,0 +1,659 @@ + + + + + Events + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Events

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Eighteenth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

Organizers: Shipeng Qi (AntGroup), Wenyuan Yu (Alibaba Damo Academy), Yan Zhou (CreateLink)

+

LDBC is hosting a two-day hybrid workshop, co-located in Guangzhou with VLDB 2024 on August 30-31 (Friday-Saturday).

+

The program consists of 10- and 15-minute talks followed by a Q&A session. The talks will be recorded and made available online. If you would like to participate, please register using our form.

+

Program

+

All times are in PDT.

+

August 30, Friday …

+ +
+
+ +
+ + +
+
+
+ +

Seventeenth TUC Meeting

+
Tags:
+ TUC MEETING + , SANTIAGO + , CHILE + +
+
+ +

Organizers: Renzo Angles, Sebastián Ferrada

+

LDBC is hosting a one-day in-person workshop, co-located in Santiago de Chile with SIGMOD 2024 on June 9 (Sunday).

+

The workshop will be held in the Hotel Plaza El Bosque Ebro (https://www.plazaelbosque.cl), which is two blocks away from SIGMOD’s venue. See the map here.

+

If you would like to participate, please register using this form.

+

Program

+

All times are in Chile time (GMT-4).

+

Each speaker will …

+ +
+
+ +
+ + +
+
+
+ +

Sixteenth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

Organizers: Oskar van Rest, Alastair Green, Gábor Szárnyas

+

LDBC is hosting a two-day hybrid workshop, co-located with SIGMOD 2023 on June 23-24 (Friday-Saturday).

+

The program consists of 10- and 15-minute talks followed by a Q&A session. The talks will be recorded and made available online. If you would like to participate, please register using our form.

+

LDBC will host a social event on Friday at the Black Bottle gastrotavern in Belltown: …

+ +
+
+ +
+ + +
+
+
+ +

Fifteenth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

Organizers: Gábor Szárnyas, Jack Waudby, Peter Boncz, Alastair Green

+

LDBC is hosting a two-day hybrid workshop, co-located with SIGMOD 2022 on June 17-18 (Friday-Saturday).

+

The program consists of 10-15 minute talks followed by a Q&A session. The talks will be recorded and made available online.
+The tentative program is the following. All times are in EDT.

+

We will have a social event on Friday at 17:30 at El Vez (Google Maps).

+

Friday ( …

+ +
+
+ +
+ + +
+
+
+ +

Fourteenth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

LDBC hosted a one-day hybrid workshop, co-located with VLDB 2021 on August 16 (Monday), from 16:00 to 20:00 CEST.

+

The physical part of the workshop was held in room Akvariet 2 of the Tivoli Hotel (Copenhagen), while the virtual part was hosted on Zoom. Our programme consisted of talks that provided an overview of LDBC’s recent efforts. Moreover, we invited industry practitioners and academic researchers to present their latest …

+ +
+
+ +
+ + +
+
+
+ +

Thirteenth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

LDBC is pleased to announce its Thirteenth Technical User Community (TUC) meeting.

+

LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) give feedback on these, (3) hear about user experiences with graph data management technologies, or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/index.xml b/event/index.xml new file mode 100644 index 00000000..c2ba7581 --- /dev/null +++ b/event/index.xml @@ -0,0 +1,5468 @@ + + + + Events on Linked Data Benchmark Council + https://ldbcouncil.org/event/ + Recent content in Events on Linked Data Benchmark Council + Hugo -- gohugo.io + en-us + &copy; Copyright LDBC 2024 + Fri, 30 Aug 2024 09:00:00 -0800 + + Eighteenth TUC Meeting + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + Fri, 30 Aug 2024 09:00:00 -0800 + + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Shipeng Qi (AntGroup), Wenyuan Yu (Alibaba Demo), Yan Zhou (CreateLink)</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located in <strong>Guangzhou</strong> with <a href="https://vldb.org/2024/">VLDB 2024</a> on <strong>August 30-31 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. <strong>If you would like to participate please register using <a href="https://forms.gle/aVPrrcxXpSwrWPnh6">our form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="august-30-friday">August 30, Friday</h4> +<p><strong>Location:</strong> <a href="https://www.langhamhotels.com/en/the-langham/guangzhou/">Langham Place</a>, Guangzhou, <strong>room 1</strong>,<br> +co-located with VLDB (N0.630-638 Xingang Dong Road, Haizhu District, Guangzhou, China). See the map <a href="https://maps.app.goo.gl/86jD3Dy9Aa7bwLs36">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="august-31-saturday">August 31, Saturday</h4> +<p><strong>Location:</strong> Alibaba Center, Guangzhou (N0.88 Dingxin Road, Haizhu District, Guangzhou, China), near to VLDB Langham Place. See the map <a href="https://maps.app.goo.gl/HgEVafZMRmrzUsgW8">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + Seventeenth TUC Meeting + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + Sun, 09 Jun 2024 09:00:00 -0400 + + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + <p><strong>Organizers:</strong> Renzo Angles, Sebastián Ferrada</p> +<p>LDBC is hosting a one-day in-person workshop, co-located in <strong>Santiago de Chile</strong> with <a href="https://2024.sigmod.org/venue.shtml">SIGMOD 2024</a> on <strong>June 9 (Sunday)</strong>.</p> +<p>The workshop will be held in the <strong>Hotel Plaza El Bosque Ebro</strong> (<a href="https://www.plazaelbosque.cl">https://www.plazaelbosque.cl</a>), which is two blocks away from SIGMOD&rsquo;s venue. 
See the map <a href="https://maps.app.goo.gl/78oiw3zo2pH3gy5R6">here</a>.</p> +<p><strong>If you would like to participate please register using <a href="https://forms.gle/XXgaQfwBZAMMZJb78">this form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in Chile time (GMT-4).</strong></p> +<p><strong>Each speaker will have 20 minutes for exposition plus 5 minutes for questions.</strong></p> +<table> +<thead> +<tr> +<th>Time</th> +<th>Speaker</th> +<th>Title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>Welcome</td> +<td>&ldquo;Canelo&rdquo; saloon</td> +</tr> +<tr> +<td>09:30</td> +<td>Alastair Green (LDBC Vice-chair)</td> +<td>Status of the LDBC Extended GQL Schema Working Group</td> +</tr> +<tr> +<td>10:00</td> +<td>Hannes Voigt (Neo4j)</td> +<td>Inside the Standardization Machine Room: How ISO/IEC 39075:2024 – GQL was produced</td> +</tr> +<tr> +<td>10:30</td> +<td>Calin Iorgulescu (Oracle)</td> +<td>PGX.D: Distributed graph processing engine</td> +</tr> +<tr> +<td>11:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>11:30</td> +<td>Ricky Sun (Ultipa, Inc.)</td> +<td>A Unified Graph Framework with SCC (Storage-Compute Coupled) and HDC (High-Density Computing) Clustering</td> +</tr> +<tr> +<td>12:00</td> +<td>Daan de Graaf (TU Eindhoven)</td> +<td>Algorithm Support in a Graph Database, Done Right</td> +</tr> +<tr> +<td>12:30</td> +<td>Angela Bonifati (Lyon 1 University and IUF, France)</td> +<td>Transforming Property Graphs</td> +</tr> +<tr> +<td>13:00</td> +<td>Brunch</td> +<td></td> +</tr> +<tr> +<td>14:00</td> +<td>Juan Sequeda (data.world)</td> +<td>A Benchmark to Understand the Role of Knowledge Graphs on Large Language Model&rsquo;s Accuracy for Question Answering on Enterprise SQL Databases</td> +</tr> +<tr> +<td>14:30</td> +<td>Olaf Hartig (Linköping University)</td> +<td>FedShop: A Benchmark for Testing the Scalability of SPARQL Federation Engines</td> +</tr> +<tr> +<td>15:00</td> +<td>Olaf Hartig (Amazon)</td> +<td>Datatypes for Lists and Maps in RDF Literals</td> +</tr> +<tr> +<td>15:30</td> +<td>Peter Boncz (CWI and MotherDuck)</td> +<td>The state of DuckPGQ</td> +</tr> +<tr> +<td>16:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>16:30</td> +<td>Juan Reutter (IMFD and PUC Chile)</td> +<td>MillenniumDB: A Persistent, Open-Source, Graph Database</td> +</tr> +<tr> +<td>17:00</td> +<td>Carlos Rojas (IMFD)</td> +<td>WDBench: A Wikidata Graph Query Benchmark</td> +</tr> +<tr> +<td>17:30</td> +<td>Sebastián Ferrada (IMFD and Univ. 
de Chile)</td> +<td>An algebra for evaluating path queries</td> +</tr> +<tr> +<td>19:30</td> +<td>Dinner</td> +<td></td> +</tr> +</tbody> +</table> + + + + + Record-Breaking SNB Interactive Results for GraphScope + https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/ + Sun, 26 May 2024 00:00:00 +0000 + + https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/ + <p>We are happy to annonunce new <a href="https://ldbcouncil.org/benchmarks/snb-interactive/">audited results for the SNB Interactive workload</a>, achieved by the open-source <a href="https://github.com/alibaba/GraphScope">GraphScope Flex</a> system.</p> +<p>The current audit of the system has broken several records:</p> +<ul> +<li>It achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s.</li> +<li>It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s.</li> +<li>It is the first system to successfully complete the benchmark on scale factor 1000. It achieved a throughput of 127.8k ops/s</li> +</ul> +<p>The audit was commissioned by the <a href="https://www.alibabacloud.com/">Alibaba Cloud</a> and was conducted by <a href="https://www.linkedin.com/in/arnau-prat-a70283bb/">Dr. Arnau Prat-Pérez</a>, one of the original authors of the SNB Interactive benchmark. The queries were implemented as C++ stored procedures and the benchmark was executed on the Alibaba Cloud&rsquo;s infrastructure. The <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf">executive summary</a>, <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf">full disclosure report</a>, and <a href="%5B/benchmarks/snb/%5D(https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-attachments.tar.gz)">supplementary package</a> describe the benchmark&rsquo;s steps and include instructions for reproduction.</p> +<p>LDBC would like to congratulate the GraphScope Flex team on their record-breaking results.</p> +<div align="center"><img src="https://ldbcouncil.org/images/graphscope.svg" width="200"></div> + + + + + Launching open-source language tools for ISO/IEC GQL + https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/ + Thu, 09 May 2024 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/ + <p>Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and tests for the GQL language. See this <a href="https://ldbcouncil.org/pages/opengql-announce">announcement from Alastair Green, Vice-chair of LDBC</a>.</p> +<p>These tools are the work of the <strong>LDBC GQL Implementation Working Group</strong>, headed up by Michael Burbidge. 
Damian Wileński and Dominik Tomaszuk have worked with Michael to create these artefacts based on his ANTLR grammar for GQL.</p> + + + + + Announcing the Official Release of LDBC Financial Benchmark v0.1.0 + https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/ + Tue, 27 Jun 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/ + <p>We are delighted to announce the official release of the initial version (v0.1.0) of <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench)</a>.</p> +<p>The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">LDBC FinBench Task Force</a>. The benchmark has one workload currently, <strong>Transaction Workload</strong>, capturing OLTP scenario with complex read queries that access the neighbourhood of a given node in the graph and write queries that continuously insert or delete data in the graph.</p> +<p>Compared to LDBC SNB, the FinBench differs in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. For a brief overview, see the <a href="https://ldbcouncil.org/benchmarks/finbench/finbench-talk-16th-tuc.pdf">slides</a> in the 16th TUC. The <a href="https://arxiv.org/pdf/2306.15975.pdf">Financial Benchmark&rsquo;s specification</a> can be found on arXiv.</p> +<p>The release of FinBench initial version (v0.1.0) was approved by LDBC on June 23, 2023. It is the good beginning of FinBench. In the future, the FinBench Task Force will polish the benchmark continuously.</p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or qishipeng.qsp at antgroup.com.</p> + + + + + Sixteenth TUC Meeting + https://ldbcouncil.org/event/sixteenth-tuc-meeting/ + Fri, 23 Jun 2023 09:00:00 -0800 + + https://ldbcouncil.org/event/sixteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Oskar van Rest, Alastair Green, Gábor Szárnyas</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2023.sigmod.org/venue.shtml">SIGMOD 2023</a> on <strong>June 23-24 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. 
<strong>If you would like to participate please register using <a href="https://forms.gle/T6bwVHzK9V5FaKyR9">our form</a>.</strong></p> +<p>LDBC will host a <strong>social event</strong> on Friday at the <a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a>.</p> +<p>In addition, AWS will host a <strong>Happy Hour</strong> (rooftop grill with beverages) on Saturday on the Amazon Nitro South building&rsquo;s 8th floor deck: <a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>.</p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="friday">Friday</h4> +<p><strong>Location:</strong> Hyatt Regency Bellevue on Seattle&rsquo;s Eastside, <strong>room Grand K</strong>, co-located with SIGMOD (<a href="https://www.hyatt.com/en-US/hotel/washington/hyatt-regency-bellevue-on-seattles-eastside/belle">900 Bellevue Way NE, Bellevue, WA 98004-4272</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>08:30</td> +<td>08:45</td> +<td>Oskar van Rest (Oracle)</td> +<td>LDBC – State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-ldbc-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/Frk7ITssaSY">video</a></td> +</tr> +<tr> +<td>08:50</td> +<td>09:05</td> +<td>Keith Hare (JCC / WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/keith-hare-an-update-on-the-gql-and-sql-pgq-standards-efforts.pdf">slides</a>, <a href="https://youtu.be/LQYkal_0j6E">video</a></td> +</tr> +<tr> +<td>09:10</td> +<td>09:25</td> +<td>Stefan Plantikow (Neo4j / WG3)</td> +<td>GQL - Introduction to a new query language standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/stefan-plantikow-gql-v1.pdf">slides</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Leonid Libkin (University of Edinburgh &amp; RelationalAI)</td> +<td>Formalizing GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/leonid-libkin-formalizing-gql.pdf">slides</a>, <a href="https://youtu.be/YZE1a00h1I4">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Semen Panenkov (JetBrains Research)</td> +<td>Mechanizing the GQL semantics in Coq – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/semyon-panenkov-gql-in-coq.pdf">slides</a>, <a href="https://youtu.be/5xBGohqWCzo">videos</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Oskar van Rest (Oracle)</td> +<td>SQL Property Graphs in Oracle Database and Oracle Graph Server (PGX) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-sql-property-graphs-in-oracle-database-and-oracle-graph-server-pgx.pdf">slides</a>, <a href="https://youtu.be/owM9WiQubpg">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (JCC)</td> +<td>LDBC&rsquo;s organizational changes and fair use policies – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-ldbc-corporate-restructuring-and-fair-use-policies.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>Ioana Manolescu (INRIA)</td> +<td>Integrating Connection Search in Graph Queries – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ioana-manolescu-integrating-connection-search-in-graph-queries.pdf">slides</a>, <a href="https://youtu.be/LQPnmcrkUpY">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Maciej Besta (ETH Zurich)</td> +<td>Neural Graph Databases with Graph Neural Networks – <a href="https://youtu.be/ce5qNievRNs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:10</td> +<td>Longbin Lai (Alibaba Damo Academy)</td> +<td>To Revisit Benchmarking Graph Analytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/longbin-lai-benchmark-ldbc.pdf">slides</a>, <a href="https://youtu.be/s9Vtt-6t_FI">video</a></td> +</tr> +<tr> +<td>12:15</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>The World of Graph Databases from An Industry Perspective – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/yuanyuan-tian-world-of-graph-databases.pdf">slides</a>, <a href="https://youtu.be/AZuP_b95GPM">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Alin Deutsch (UC San Diego &amp; TigerGraph)</td> +<td>TigerGraph&rsquo;s Parallel Computation Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alin-deutsch-tigergraphs-computation-model.pdf">slides</a>, <a href="https://youtu.be/vcxdieJB80Y">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Chen Zhang (CreateLink)</td> +<td>Applications of a Native Distributed Graph Database in the Financial Industry – <a href="https://youtu.be/GCCT79Sps9I">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Ricky Sun (Ultipa)</td> +<td>Design of highly scalable graph database systems – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ricky-sun-ultipa.pdf">slides</a>, <a href="https://youtu.be/Sg1F64O4vGM">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Heng Lin (Ant Group)</td> +<td>The LDBC SNB implementation in TuGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-the-ldbc-snb-implementation-in-tugraph.pdf">slides</a>, <a href="https://youtu.be/fy8AuVerwnY">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>Shipeng Qi (Ant Group)</td> +<td>FinBench: The new LDBC benchmark targeting financial scenario – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/shipeng-qi-finbench.pdf">slides</a>, <a href="https://youtu.be/0xLZadDOfZk">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>17:00</td> +<td>host: Heng Lin (Ant Group), panelists: Longbin Lai (Alibaba Damo Academy), Ricky Sun (Ultipa), Gabor Szarnyas (CWI), Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>FinBench panel – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-finbench-panel.pdf">slides</a></td> +</tr> +<tr> +<td>19:00</td> +<td>22:00</td> +<td><em>dinner</em></td> +<td><em><a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a></em></td> +</tr> +</tbody> +</table> +<h4 id="saturday">Saturday</h4> +<p><strong>Location:</strong> Amazon Nitro South building, <strong>room 03.204</strong> (<a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>09:45</td> +<td>Brad Bebee (AWS)</td> +<td>Customers don&rsquo;t want a graph database, so why are we still here? – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/brad-bebee-tuc-keynote.pdf">slides</a>, <a href="https://youtu.be/bJlkpDC--fM">video</a></td> +</tr> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Fast and Efficient Update Handling for Graph H2TAP – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/muhammad-attahir-jibril-fast-and-efficient-update-handling-for-graph-h2tap.pdf">slides</a>, <a href="https://youtu.be/e8ZAszBsXV0">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Gabor Szarnyas (CWI)</td> +<td>LDBC Social Network Benchmark and Graphalytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-social-network-benchmark-and-graphalytics.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:30</td> +<td>Atanas Kiryakov and Tomas Kovachev (Ontotext)</td> +<td>GraphDB – Benchmarking against LDBC SNB &amp; SPB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tomas-kovatchev-atanas-kiryakov-benchmarking-graphdb-with-snb-and-spb.pdf">slides</a>, <a href="https://youtu.be/U6OPpNFOWqg">video</a></td> +</tr> +<tr> +<td>11:35</td> +<td>11:50</td> +<td>Roi Lipman (Redis Labs)</td> +<td>Delta sparse matrices within RedisGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/roi-lipman-delta-matrix.pdf">slides</a>, <a href="https://youtu.be/qfKsplV4Ihk">video</a></td> +</tr> +<tr> +<td>11:55</td> +<td>12:05</td> +<td>Rathijit Sen (Microsoft)</td> +<td>Microarchitectural Analysis of Graph BI Queries on RDBMS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/rathijit-sen-microarchitectural-analysis.pdf">slides</a>, <a href="https://youtu.be/55B8CkH09js">video</a></td> +</tr> +<tr> +<td>12:10</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td><em>on your own</em></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Alastair Green (JCC)</td> +<td>LEX &ndash; LDBC Extended GQL Schema – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-lex.pdf">slides</a>, <a href="https://youtu.be/DVpeb4Ce9Uw">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Ora Lassila (AWS)</td> +<td>Why limit yourself to {RDF, LPG} when you can do {RDF, LPG}, 
too – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ora-lassila-why-limit-yourself-to-lpg-when-you-can-do-rdf-too.pdf">slides</a>, <a href="https://youtu.be/7uAInoUwdds">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Jan Hidders (Birkbeck, University of London)</td> +<td>PG-Schema: a proposal for a schema language for property graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/jan-hidders-pg-schema.pdf">slides</a>, <a href="https://youtu.be/yQNL8hBTE4M">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Max de Marzi (RageDB and RelationalAI)</td> +<td>RageDB: Building a Graph Database in Anger – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/max-de-marzi-ragedb-building-a-graph-database-in-anger.pdf">slides</a>, <a href="https://youtu.be/LBbF8aslYFE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Umit Catalyurek (AWS)</td> +<td>HPC Graph Analytics on the OneGraph Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/umit-catalyurek-onegraph-hpc.pdf">slides</a>, <a href="https://youtu.be/64tv5LA6Wr8">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>David J. Haglin (Trovares)</td> +<td>How LDBC impacts Trovares – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/david-haglin-trovares.pdf">slides</a>, <a href="">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>16:25</td> +<td>Wenyuan Yu (Alibaba Damo Academy)</td> +<td>GraphScope Flex: A Graph Computing Stack with LEGO-Like Modularity – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/wenyuan-yu-graphscope-flex.pdf">slides</a>, <a href="https://youtu.be/cRikoyDmMks">video</a></td> +</tr> +<tr> +<td>16:30</td> +<td>16:40</td> +<td>Scott McMillan (Carnegie Mellon University)</td> +<td>Graph processing using GraphBLAS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/scott-mcmillan-graph-processing-using-graphblas.pdf">slides</a>, <a href="https://youtu.be/yb4hGBhUzQQ">video</a></td> +</tr> +<tr> +<td>16:45</td> +<td>16:55</td> +<td>Tim Mattson (Intel)</td> +<td>Graphs (GraphBLAS) and storage (TileDB) as Sparse Linear algebra – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tim-mattson-graphblas-and-tiledb.pdf">slides</a></td> +</tr> +<tr> +<td>17:00</td> +<td>20:00</td> +<td><em>happy hour (rooftop grill with beverages)</em></td> +<td><em>on the Nitro South building&rsquo;s 8th floor deck</em></td> +</tr> +</tbody> +</table> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + LDBC SNB – Early 2023 updates + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + Wed, 15 Feb 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + <p>2023 has been an eventful year for us so far. 
Here is a summary of our recent activities.</p> +<ol> +<li> +<p>Our paper <a href="https://ldbcouncil.org/docs/papers/ldbc-snb-bi-vldb-2022.pdf">The LDBC Social Network Benchmark: Business Intelligence Workload</a> was published in PVLDB.</p> +</li> +<li> +<p>David Püroja just completed his MSc thesis on creating a design towards <a href="https://ldbcouncil.org/docs/papers/msc-thesis-david-puroja-snb-interactive-v2-2023.pdf">SNB Interactive v2</a> at CWI&rsquo;s Database Architectures group. David and I gave a deep-dive talk at the FOSDEM conference&rsquo;s graph developer room titled <a href="https://fosdem.org/2023/schedule/event/graph_ldbc/">The LDBC Social Network Benchmark</a> (<a href="https://www.youtube.com/watch?v=YNF6z6gtXY4">YouTube mirror</a>).</p> +</li> +<li> +<p>I gave a lightning talk at FOSDEM&rsquo;s HPC developer room titled <a href="https://www.youtube.com/watch?v=q26DHnQFw54">The LDBC Benchmark Suite</a> (<a href="https://www.youtube.com/watch?v=q26DHnQFw54">YouTube mirror</a>).</p> +</li> +<li> +<p>Our auditors have successfully benchmark a number of systems:</p> +<ul> +<li>SPB with the Ontotext GraphDB systems for the SF3 and SF5 data sets (auditor: Pjotr Scholtze)</li> +<li>SNB Interactive with the Ontotext GraphDB system for the SF30 data set (auditor: David Püroja)</li> +<li>SNB Interactive with the TuGraph system running in the Aliyun cloud for the SF30, SF100, and SF300 data sets (auditor: Márton Búr)</li> +</ul> +</li> +</ol> +<p>The results and the full disclosure reports are available under the <a href="https://ldbcouncil.org/benchmarks/spb/">SPB</a> and <a href="https://ldbcouncil.org/benchmarks/snb/">SNB benchmark pages</a>.</p> + + + + + LDBC SNB Datagen – The winding path to SF100K + https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/ + Tue, 13 Sep 2022 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/ + <p>LDBC SNB provides a data generator, which produces synthetic datasets, mimicking a social network’s activity during a period of time. Datagen is defined by the charasteristics of realism, scalability, determinism and usability. More than two years have elapsed since my <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">last technical update</a> on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the challenges I faced during the migration. Since then, we reached several goals such as we refactored the serializers to use Spark&rsquo;s high-level writers to support the popular Parquet data format and to enable running on spot nodes; brought back factor generation; implemented support for the novel BI benchmark; and optimized the runtime to generate SF30K on 20 i3.4xlarge machines on AWS.</p> +<h1 id="moving-to-sparksql">Moving to SparkSQL</h1> +<p>We planned to move parts of the code to SparkSQL, an optimized runtime framework for tabular data. We hypothesized that this would benefit us on multiple fronts: SparkSQL offers an efficient batch analytics runtime, with higher level abstractions that are simpler to understand and work with, and we could easily add support for serializing to Parquet based on SparkSQL&rsquo;s capabilites.</p> +<blockquote> +<p>Spark SQL is a Spark module for structured data processing. It provides a programming abstraction called DataFrames and can also act as a distributed SQL query engine. 
Spark SQL includes a cost-based optimizer, columnar storage, and code generation to make queries fast.</p> +</blockquote> +<p>Dealing with the dataset generator proved quite tricky, because it samples from various hand-written distributions and dictionaries, and contains complex domain logic, for which SparkSQL unsuitable. We assessed that the best thing we could do is wrap entire entity generation procedures in UDFs (user defined SQL functions). However, several of these generators return entity trees<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup>, which are spread across multiple tables by the serializer, and these would have needed to be split up. Further complicating matters, we would have also had to find a way to coordinate the inner random generators&rsquo; state between the UDFs to ensure deterministic execution. Weighing these and that we could not find much benefit in SparkSQL, we ultimately decided to leave entity generation as it is. We limited the SparkSQL refactor to the following areas:</p> +<ol> +<li>table manipulations related to shaping the output into the supported layouts and data types as set forth in the specification;</li> +<li>deriving the Interactive and BI datasets;</li> +<li>and generating the factor tables, which contain analytic information, such as population per country, number of friendships between city pairs, number of messages per day, etc., used by the substitution parameter generator to ensure predictable query runtimes.</li> +</ol> +<p>We refer to points (1.) and (2.) collectively as dataset transformation, while (3.) as factor generation. Initially, these had been part of the generator, extracted as part of this refactor, which resulted in cleaner, more maintainable design.</p> +<p><img src="datagen_df_0.png" alt="Datagen stages"></p> +<p>The diagram above shows the components on a high level. The generator outputs a dataset called IR (intermediate representation), which is immediately written to disk. Then, the IR is input to the dataset transformation and factor generation stages, which respectively generate the final dataset and the factor tables. We are aware that spitting out the IR adds considerable runtime overhead and doubles the disk requirements in the worst-case scenario, however, we found that there&rsquo;s no simple way to avoid<br> +it, as the generator produces entity trees, which are incompatible with the flat, tabular, column oriented layout of SparkSQL. On the positive side, this design enables us to reuse the generator output for multiple transformations and add new factor tables without regenerating the data.</p> +<p>I&rsquo;ll skip describing the social network graph dataset generator (i.e. stage 1) in any more detail, apart from its serializer, as that was the only part involved in the current refactor. 
If you are interested in more details, you may look up the <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">previous blogpost in the series</a> or the <a href="https://arxiv.org/abs/2001.02299">Interactive benchmark specification</a>.</p> +<h1 id="transformation-pipeline">Transformation pipeline</h1> +<p>The dataset transformation stage sets off where generation finished, and applies an array of pluggable transformations:</p> +<ul> +<li>explodes edges and / or attributes into separate tables,</li> +<li>subsets the snapshot part and creates insert / delete batches for the BI workload,</li> +<li>subsets the snapshot part for the Interactive workload,</li> +<li>applies formatting related options such as date time representation,</li> +<li>serializes the data to a Spark supported format (CSV, Parquet),</li> +</ul> +<p>We utilize a flexible data pipeline that operates on the graph.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span>, <span style="color:#66d9ef">M2</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">]</span> <span style="color:#a6e22e">extends</span> <span style="color:#f92672">(</span><span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">])</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">In</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> apply<span style="color:#f92672">(</span>v<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">])</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=</span> transform<span 
style="color:#f92672">(</span>v<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>The <code>Transform</code> trait encodes a pure (side effect-free) function polymorphic over graphs, so that transformation pipelines can be expressed with ordinary function composition in a type safe manner. Let&rsquo;s see some of the transformations we have.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToBiTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">BI</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> keepImplicitDeletes<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.BI</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span 
style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeEdges</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Therefore, a transformation pipeline may look like this:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>params<span style="color:#f92672">,</span> start<span style="color:#f92672">,</span> end<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span 
style="color:#66d9ef">val</span> outputGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>inputGraph<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>The <code>Graph</code> record has a <code>definition</code> field containing graph-global metadata, whereas <code>entities</code> holds the datasets keyed by their entity type. There are 3 graph <em>modes</em> currently: <code>Raw</code>, <code>Interactive</code> and <code>BI</code>. The BI dataset has different layout than the rest, as it contains incremental inserts and deletes for the entities additionally to the bulk snapshot. This is captured in the <code>Layout</code> dependent type, over which the entities are polymorphic.</p> +<p>It&rsquo;s important to understand that <code>Graph</code> holds <code>DataFrame</code>s, and these are lazily computed by Spark. So, <code>Graph</code> is merely a description of transformations used to derive the comprising datasets, which makes them subject to all the SparkSQL fanciness such as query optimization, whole stage code generation, and so on. Processing is delayed until an action (such as a disk write) forces it.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> isAttrExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> isEdgesExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> useTimestamp<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">M</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">Option</span><span style="color:#f92672">[</span><span style="color:#66d9ef">String</span><span style="color:#f92672">]]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> definition<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M</span><span style="color:#f92672">],</span> 
+</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">M</span><span style="color:#66d9ef">#</span><span style="color:#66d9ef">Layout</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">sealed</span> <span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Raw</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Interactive</span><span style="color:#f92672">(</span>bulkLoadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... 
*/</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">BI</span><span style="color:#f92672">(</span>bulkloadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">,</span> batchPeriod<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">String</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">BatchedEntity</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>You may notice that <code>Transform</code> is statically typed w.r.t. <code>Mode</code>; however, other properties, like <code>isAttrExploded</code> or <code>isEdgesExploded</code>, are not captured in the type and are only checked at runtime. This makes some nonsensical transformation pipelines (e.g. one that explodes edges twice in a row) syntactically valid. This trade-off in compile-time safety was made to prevent overcomplicating the types.</p> +<p>As we already mentioned, <code>Graph</code> is essentially a persistent container of <code>EntityType -&gt; DataFrame</code> mappings. <code>EntityType</code> can be <code>Node</code>, <code>Edge</code> or <code>Attr</code>, and is used to identify the entity and embellish it with static metadata, such as a descriptive name and primary key, whether it is static or dynamic (as per the specification), and, in the case of edges, the source and destination type and cardinality. This makes it very simple to create transformation rules on static entity properties with pattern matching.</p> +<p>Usually, a graph transformation involves matching entities based on their <code>EntityType</code>, and modifying the mapping (and if required, other metadata). 
Take, for example, the <code>ExplodeAttrs</code> transformation, which explodes into separate tables the values of two columns of <code>Person</code> stored as arrays:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">if</span> <span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#75715e">// assert at runtime that the transformation hasn&#39;t been applied yet +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#66d9ef">throw</span> <span style="color:#66d9ef">new</span> <span style="color:#a6e22e">AssertionError</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Attributes already exploded in the input graph&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> explodedAttr<span style="color:#f92672">(</span>attr<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Attr</span><span style="color:#f92672">,</span> node<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">DataFrame</span><span style="color:#f92672">,</span> column<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Column</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">=</span> +</span></span><span style="display:flex;"><span> attr <span style="color:#f92672">-&gt;</span> node<span style="color:#f92672">.</span>select<span style="color:#f92672">(</span>withRawColumns<span style="color:#f92672">(</span>attr<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>parent<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">),</span> explode<span style="color:#f92672">(</span>split<span style="color:#f92672">(</span>column<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;;&#34;</span><span 
style="color:#f92672">)).</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>attribute<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">)))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> modifiedEntities <span style="color:#66d9ef">=</span> input<span style="color:#f92672">.</span>entities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>collect <span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k <span style="color:#66d9ef">@</span> <span style="color:#a6e22e">Node</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person&#34;</span><span style="color:#f92672">,</span> <span style="color:#66d9ef">false</span><span style="color:#f92672">),</span> df<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#75715e">// match the Person node. This is the only one ExplodeAttrs should modify +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#a6e22e">Map</span><span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Email&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;EmailAddress&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonEmailEmailAddress&#34; entity derived by exploding the email column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Speaks&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;Language&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonSpeaksLanguage&#34; entity derived by exploding the language column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> k <span style="color:#f92672">-&gt;</span> df<span style="color:#f92672">.</span>drop<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">)</span> <span style="color:#75715e">// drop the exploded columns from person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> 
updatedEntities <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>entities<span style="color:#f92672">)(</span><span style="color:#66d9ef">_</span> <span style="color:#f92672">++</span> <span style="color:#66d9ef">_</span><span style="color:#f92672">)</span> <span style="color:#75715e">// merge-replace the modified entities in the graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> updatedEntityDefinitions <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#f92672">(</span>e<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> e <span style="color:#f92672">++</span> v<span style="color:#f92672">.</span>map<span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> k <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Some</span><span style="color:#f92672">(</span>v<span style="color:#f92672">.</span>schema<span style="color:#f92672">.</span>toDDL<span style="color:#f92672">)</span> <span style="color:#f92672">}</span> <span style="color:#75715e">// update the entity definition schema to reflect the modifications +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> l <span style="color:#66d9ef">=</span> lens<span style="color:#f92672">[</span><span style="color:#66d9ef">In</span><span style="color:#f92672">]</span> <span style="color:#75715e">// lenses provide a terse syntax for modifying nested fields +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">(</span>l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>entities<span style="color:#f92672">).</span>set<span style="color:#f92672">(</span>input<span style="color:#f92672">)((</span><span style="color:#66d9ef">true</span><span style="color:#f92672">,</span> updatedEntityDefinitions<span style="color:#f92672">,</span> updatedEntities<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Note that <code>EntityType</code> does not hold the dataset&rsquo;s full SQL schema currently, as it&rsquo;s not useful for pattern matching, but can be accessed 
directly from <code>DataFrame</code> if needed.</p> +<h1 id="inputoutput">Input/output</h1> +<p>The <code>Reader</code> and <code>Writer</code> typeclasses are used to read from a <code>Source</code> and write to a <code>Sink</code> respectively, terminating a graph transformation pipeline<br> +on both ends.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">T</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> read<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> exists<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">S</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Data</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> write<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Data</span><span style="color:#f92672">,</span> sink<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">S</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Unit</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>There are implementations under <code>ldbc.datagen.io.instances</code> that read a graph from a <code>GraphSource</code> and write to a <code>GraphSink</code>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span 
style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> source <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSource</span>, <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>read<span style="color:#f92672">(</span>source<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span><span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>graph<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// write +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> sink <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSink</span>, <span 
style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>write<span style="color:#f92672">(</span>transformedGraph<span style="color:#f92672">,</span> sink<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>We provide <a href="https://github.com/typelevel/simulacrum">Ops syntax</a> to make it shorter:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Reader.ops._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Writer.ops._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">).</span>read +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> <span style="color:#f92672">???</span> <span style="color:#75715e">/* ... 
*/</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// write +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span> +</span></span><span style="display:flex;"><span>transformedGraph<span style="color:#f92672">.</span>write<span style="color:#f92672">(</span><span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">))</span> +</span></span></code></pre></div><p>The reader/writer architecture is layered: the graph reader/writer uses dataframe readers/writers for each of its entities. One interesting aspect of implementing the reader was dealing with the input schema. Parquet is self-describing; however, as we also support the CSV format, we had to provide a way for correct schema detection and column parsing.</p> +<p>Spark has a facility to derive SparkSQL schema from case classes automatically<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup>. We created case classes for each entity in the <code>Raw</code> dataset. We also created a typeclass <code>EntityTraits</code> associating these classes with their <code>EntityType</code>, so we can summon them (and consequently their SparkSQL schema) in the reader.</p> +<p>The case classes are used during the serialization of the generated dataset too, but more about that later.</p> +<h1 id="factor-generation">Factor generation</h1> +<p>As we already mentioned, factor generation was originally part of the data generator, i.e. factor tables were calculated on the fly and emitted as side outputs. This design had some problems. Auxiliary data structures had to be maintained and interleaved with generation, which violated separation of concerns and consequently hurt readability and maintainability. Also, anything more complicated than entity-local aggregates was impossible to express in the original MapReduce framework. To keep the preceding Spark rewrite at a manageable scope, the original factor generation code had been removed.</p> +<p>We decided it was best to reintroduce factor generation as a post-processing step that operates on the generated data. This makes it possible to express more complex analytical queries, requires no prior knowledge about the generator, can be done in SparkSQL (making it much simpler), and removes the impact on the generator&rsquo;s performance, so that the two can be optimized separately. Since this refactor, we have almost tripled the number of factor tables (up to 31, covering both SNB workloads, BI and Interactive). The queries computing certain factor tables even use <a href="https://spark.apache.org/graphx/">GraphX</a>, which was unimaginable with the previous design.</p> +<p>Factor tables are added by extending a map with a <code>name -&gt; Factor</code> pair. 
<code>Factor</code> declares is input entities, and accepts a function that receives input <code>DataFrames</code>, and returns a single <code>DataFrame</code> as output.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> factors <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Map</span> <span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;personDisjointEmployerPairs&#34;</span> <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Factor</span><span style="color:#f92672">(</span><span style="color:#a6e22e">PersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonKnowsPersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">OrganisationType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonWorkAtCompanyType</span><span style="color:#f92672">)</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">case</span> <span style="color:#a6e22e">Seq</span><span style="color:#f92672">(</span>person<span style="color:#f92672">,</span> personKnowsPerson<span style="color:#f92672">,</span> organisation<span style="color:#f92672">,</span> workAt<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> knows <span style="color:#66d9ef">=</span> undirectedKnows<span style="color:#f92672">(</span>personKnowsPerson<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> company <span style="color:#66d9ef">=</span> organisation<span style="color:#f92672">.</span>where<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;Type&#34;</span> <span style="color:#f92672">===</span> <span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">).</span>cache<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> personSample <span style="color:#66d9ef">=</span> person +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>orderBy<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>limit<span style="color:#f92672">(</span><span style="color:#ae81ff">20</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> personSample +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person2&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>knows<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;knows&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;knows.person2Id&#34;</span> <span style="color:#f92672">===</span> $<span 
style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>workAt<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;workAt&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;workAt.PersonId&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;knows.Person1id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>company<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;Company.id&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;workAt.CompanyId&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>select<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2id&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.name&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyName&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyId&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.creationDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2creationDate&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.deletionDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2deletionDate&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>distinct<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">},</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* more factors */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span></code></pre></div><p>As you can see, it&rsquo;s not much complicated than using plain SQL, with the added benefit of being able to extract recurring subqueries to functions (e.g. <code>undirectedKnows</code>). Currently, there&rsquo;s no parallelization between different factor tables (although each of them is parallelized internally by Spark). 
The Factor table writer uses the same componentized architecture as the graph writer, i.e. it uses the dataframe writer under the hood.</p> +<h1 id="revamping-the-data-generators-serializer">Revamping the data generator&rsquo;s serializer</h1> +<p>At this point, both the transformation pipeline and the factor generator were ready; however, the data generator was still chugging along with the old serializer, emitting the IR in CSV. We wanted to move this to Parquet to improve performance and reduce its size, but there was a problem: due to the generator&rsquo;s custom data representation, SparkSQL (and its DataSource API) was off-limits. So we bit the bullet and rewrote the existing serializer to emit Parquet.</p> +<blockquote> +<p><a href="https://parquet.apache.org/">Parquet</a> is an open source data format that evolved to be the de facto standard for Big Data batch pipelines. It offers a column-oriented, compressed, schemaful representation that is space-efficient and suited for analytic queries. The file format leverages a record shredding and assembly model, which originated at Google. This results in a file that is optimized for query performance and minimizing I/O.</p> +</blockquote> +<p>The new serialization framework is heavily influenced by the design of Java <code>OutputStreams</code>, in the sense that stateful objects are composed to form a pipeline. For example, in the case of <em>activities</em>, the input is an activity tree, and the output is a set of rows in multiple files (e.g. forum, forumHasTag, post, postHasTag, etc.). The components that take part in activity serialization are shown in the diagram below. The activity tree is iterated (1st component) and the corresponding entity serializer is called (2nd component), which feeds into a component that splits the records (3rd component) among several output streams writing individual files (last component).</p> +<p><img src="activity.png" alt="Activity serialization pipeline"></p> +<p>The benefit of this architecture is that only the last component needs to change when we add support for a new output format.</p> +<p>To support Parquet, we made use of row-level serializers available in Hadoop&rsquo;s Parquet library (bundled with SparkSQL), and internal classes in SparkSQL to derive Parquet schema for our entities. Remember how we used case classes for the <code>Raw</code> entities to derive the input schema in the graph reader during dataset transformation? Here we use the same classes (e.g. <code>Forum</code>) and Spark&rsquo;s <code>Encoder</code> framework to encode the entities in Parquet, which means that the generated output remains consistent with the <code>DataFrame</code>-based reader, and we spare a lot of code duplication.</p>
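+<p>To make this composition concrete, here is a minimal, hypothetical sketch of the pipeline described above. The names (<code>RecordSink</code>, <code>RecordSplitter</code>, <code>ForumSerializer</code>) are illustrative only and not the actual datagen classes; the point is that only the sink component has to be reimplemented to support a new output format.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">// Hypothetical sketch of the composed serializer pipeline (illustrative names only).
+trait RecordSink {                            // last component: format-specific row output
+  def write(entityName: String, row: Seq[Any]): Unit
+}
+
+class RecordSplitter(sink: RecordSink) {      // 3rd component: splits records among output streams
+  def emit(entityName: String, row: Seq[Any]): Unit = sink.write(entityName, row)
+}
+
+class ForumSerializer(out: RecordSplitter) {  // 2nd component: flattens one entity into rows
+  def serialize(forumId: Long, title: String, tagIds: Seq[Long]): Unit = {
+    out.emit(&#34;Forum&#34;, Seq(forumId, title))
+    tagIds.foreach(tag =&gt; out.emit(&#34;Forum_hasTag_Tag&#34;, Seq(forumId, tag)))
+  }
+}
+</code></pre></div>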
+<h1 id="optimizations">Optimizations</h1> +<p>After these refactors, we were able to generate the BI dataset with scale factor 10K on 300 i3.4xlarge machines in one hour. Decreasing the number of machines resulted in out-of-memory errors in the generator. We realized partition sizes (and thus the number of partitions) should be determined based on available memory. Our experiments showed that a machine with 128GB of memory is capable of generating SF3K (scale factor 3000) reliably with 3 blocks<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> per partition, given ample disk size to allow for spills (tested with 3.8TB); while fewer partitions (and consequently a larger block/partition ratio) would introduce OOM errors. Furthermore, we split the data generator output after a certain number of rows written, to guard against the possibility that skew between different kinds of entities causes problems during transformation<sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup>. These optimizations enabled us to run SF10K reliably on 4 i3.4xlarge machines in 11 hours (which is still more than a 6x reduction in cost). We weren&rsquo;t able to run SF30K on 10 machines (1 machine / SF3K); even 15 ran out of disk. This non-linear disk use should be investigated further as it complicates calculating cluster sizes for larger scale factors.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf3k_bi <span style="color:#ae81ff">3000</span> parquet bi <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">330</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs +</span></span></code></pre></div><div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf10k_bi <span style="color:#ae81ff">10000</span> parquet bi <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">1000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs +</span></span></code></pre></div><p>The above examples show working configurations for generating the 3K and 10K BI datasets. The <code>--sf-per-executor</code> option controls the number of worker nodes allocated, in this case one node for every 3000 SF, i.e. 1 and 4 nodes respectively. The <code>--partitions</code> option controls the total number of partitions, and was calculated based on the number of persons using the formula <code>partitions = ceil(number_of_persons / block_size / 3)</code> to get a maximum of 3 blocks per partition.</p>
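+<p>As a quick, hypothetical sanity check of this formula (assuming only the 10,000-person block size from footnote 3), working backwards from the commands above: a person count of roughly 9.9 million would yield the 330 partitions used for SF3K, and roughly 30 million the 1000 partitions used for SF10K.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">// Illustrative only: the partition formula above as a small Scala helper.
+val blockSize = 10000.0                    // persons per block (see footnote 3)
+
+def partitionsFor(numberOfPersons: Long, blocksPerPartition: Int = 3): Long =
+  math.ceil(numberOfPersons / blockSize / blocksPerPartition).toLong
+
+partitionsFor(9900000L)   // 330, matching the sf3k_bi command above
+partitionsFor(30000000L)  // 1000, matching the sf10k_bi command above
+</code></pre></div>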
+<h1 id="conclusion">Conclusion</h1> +<p>These improvements made LDBC SNB datagen more modular, maintainable and efficient, costing under a cent per scale factor to generate the BI dataset, which enables us to generate datasets beyond SF 100K.</p> +<h1 id="footnotes">Footnotes</h1> +<div class="footnotes" role="doc-endnotes"> +<hr> +<ol> +<li id="fn:1"> +<p>The generator produces hierarchies, such as a forum wall with a random number of posts, which in turn have comments, etc. This tree is iterated, and different entities are written to separate files.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:2"> +<p>Shameless plug: You can learn more about this in <a href="https://www.dataversity.net/case-study-deriving-spark-encoders-and-schemas-using-implicits/">another blogpost of mine</a>.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:3"> +<p>The data generator produces blocks of 10,000 persons and their related entities. Entities from different blocks are unrelated (isolated).&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:4"> +<p>The maximum row count per file is currently 10M; however, this can be modified with a command-line option. We also had an alternative design in mind where this number would have been determined based on the average row size of each entity; however, we stayed with the first version for simplicity.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +</ol> +</div> + + + + + Fifteenth TUC Meeting + https://ldbcouncil.org/event/fifteenth-tuc-meeting/ + Fri, 17 Jun 2022 09:20:00 -0500 + + https://ldbcouncil.org/event/fifteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Gábor Szárnyas, Jack Waudby, Peter Boncz, Alastair Green</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2022.sigmod.org/venue.shtml">SIGMOD 2022</a> on <strong>June 17-18 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10-15 minute talks followed by a Q&amp;A session. The talks will be recorded and made available online.<br> +The tentative program is the following. 
<strong>All times are in EDT.</strong></p> +<p>We will have a social event on Friday at 17:30 at <a href="https://elvezrestaurant.com/">El Vez</a> (<a href="https://g.page/ElVezPhilly">Google Maps</a>).</p> +<h4 id="friday-pennsylvania-convention-centerhttpswwwpaconventioncom-room-204bhttps2022sigmodorgprogramshtml">Friday (<a href="https://www.paconvention.com/">Pennsylvania Convention Center</a>, <a href="https://2022.sigmod.org/program.shtml">room 204B</a>)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:20</td> +<td>09:30</td> +<td>Peter Boncz (LDBC/CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/39BoOIGk9Is">video</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Alastair Green (LDBC/Birkbeck)</td> +<td>LDBC&rsquo;s fair use policies – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-fair-use-of-the-ldbc-trademark.pdf">slides</a>, <a href="https://youtu.be/7zmCysN4Rpg">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Gábor Szárnyas (LDBC/CWI), Jack Waudby (Newcastle University)</td> +<td>LDBC Social Network Benchmark: Business Intelligence workload v1.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/gabor-szarnyas-the-ldbc-social-network-benchmark-business-intelligence-workload.pdf">slides</a>, <a href="https://youtu.be/AJ96M8_njxE">video</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Heng Lin (Ant Group)</td> +<td>LDBC Financial Benchmark introduction – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/heng-lin-ldbc-financial-benchmark-introduction.pdf">slides</a>, <a href="https://youtu.be/iBhud_YjafY">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Chen Zhang (CreateLink)</td> +<td>New LDBC SNB benchmark record by Galaxybase: More than 6 times faster and 70% higher throughput – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/chen-zhang-new-ldbc-snb-benchmark-record-by-galaxybase-more-than-6-times-faster-and-70-percent-higher-throughput.pdf">slides</a>, <a href="https://youtu.be/sMzTsb8iw_Y">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>James Clarkson (Neo4j)</td> +<td>LDBC benchmarks: Promoting good science and industrial consumption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/james-clarkson-ldbc-benchmarks-promoting-good-science-and-industrial-consumption.pdf">slides</a>, <a href="https://youtu.be/VYG1mzcl9qQ">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Oskar van Rest (Oracle)</td> +<td>Creating and querying property graphs in Oracle, on-premise and in the cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oskar-van-rest-creating-and-querying-property-graphs-in-oracle-on-premise-and-in-the-cloud.pdf">slides</a>, <a href="https://youtu.be/2HX2Vixf2gs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:15</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>Conquering LDBC SNB BI at SF-10k – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/mingxi-wu-conquering-ldbc-snb-bi-at-sf10k.pdf">slides</a>, <a href="https://youtu.be/oJbqzQ_t3G8">video</a></td> +</tr> +<tr> +<td>12:20</td> +<td>13:20</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:20</td> +<td>13:35</td> +<td>Altan Birler (Technische Universität München)</td> +<td>Relational databases can handle graphs too! Experiences with optimizing the Umbra RDBMS for LDBC SNB BI – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/altan-birler-relational-databases-can-handle-graphs-too.pdf">slides</a>, <a href="https://youtu.be/cRgbdY3I2i4">video</a></td> +</tr> +<tr> +<td>13:40</td> +<td>13:55</td> +<td>David Püroja (CWI)</td> +<td>LDBC Social Network Benchmark: Interactive workload v2.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/david-puroja-ldbc-snb-interactive-workload-v2.0.pdf">slides</a></td> +</tr> +<tr> +<td>14:00</td> +<td>14:15</td> +<td>Angela Bonifati (Lyon 1 University)</td> +<td>The quest for schemas in graph databases – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/angela-bonifati-the-quest-for-schemas-in-graph-databases.pdf">slides</a>, <a href="https://youtu.be/VT7cx3Jp7V8">video</a></td> +</tr> +<tr> +<td>14:20</td> +<td>14:35</td> +<td>Matteo Lissandrini (Aalborg University)</td> +<td>Understanding graph data representations in triplestores – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/matteo-lissandrini-understanding-graph-data-representations-in-triplestores.pdf">slides</a>, <a href="https://youtu.be/xqVMJZfh_JU">video</a></td> +</tr> +<tr> +<td>14:40</td> +<td>14:55</td> +<td>Wim Martens (University of Bayreuth)</td> +<td>Path representations – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/wim-martens-path-representations.pdf">slides</a>, <a href="https://youtu.be/Ma-E5dwgf-E">video</a></td> +</tr> +<tr> +<td>15:00</td> +<td>15:20</td> +<td>Audrey Cheng (UC Berkeley)</td> +<td>TAOBench: An end-to-end benchmark for social network workloads – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/audrey-cheng-taobench.pdf">slides</a>, <a href="https://youtu.be/1p8AStxS3es">video</a></td> +</tr> +</tbody> +</table> +<h4 id="saturday-philadelphia-marriott-downtownhttpswwwmarriottcomen-ushotelsphldt-philadelphia-marriott-downtown-room-401-402-4th-floor">Saturday (<a href="https://www.marriott.com/en-us/hotels/phldt-philadelphia-marriott-downtown/">Philadelphia Marriott Downtown</a>, room 401-402, 4th floor)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Keith Hare (WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/keith-hare-property-graph-standards-process-and-timing.pdf">slides</a>, <a href="https://youtu.be/xFVD3LWnKlc">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>10:35</td> +<td>Leonid Libkin (ENS Paris)</td> +<td>Pattern matching in GQL and SQL/PGQ – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/leonid-libkin-pattern-matching-in-gql-and-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/OvGsa0qLANE">video</a></td> +</tr> +<tr> +<td>10:40</td> +<td>10:55</td> +<td>Petra Selmer (Neo4j/WG3)</td> +<td>An overview of GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/petra-selmer-towards-gql-v1-a-property-graph-query-language-standard.pdf">slides</a>, <a href="https://youtu.be/tncf2FgyIyo">video</a></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (LDBC/WG3)</td> +<td>GQL 2.0: A technical manifesto – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-gql-2.0-a-technical-manifesto.pdf">slides</a>, <a href="https://youtu.be/upIvpYy8C2g">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>George Fletcher (TU Eindhoven)</td> +<td>PG-Keys (LDBC Property Graph Schema Working Group) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/george-fletcher-pg-keys-keys-for-property-graphs.pdf">slides</a>, <a href="https://youtu.be/_W8-jOtcObc">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Arvind Shyamsundar (Microsoft)</td> +<td>Graph capabilities in Microsoft SQL Server and Azure SQL Database – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/arvind-shyamsundar-graph-capabilities-in-microsoft-sql-server-and-azure-database.pdf">slides</a>, <a href="https://youtu.be/xxV2BfZupGw">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>13:30</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Daniël ten Wolde (CWI)</td> +<td>Implementing SQL/PGQ in DuckDB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/daniel-ten-wolde-implementing-sql-pgq-in-duckdb.pdf">slides</a>, <a href="https://youtu.be/JmSfU0BTH5w">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Oszkár Semeráth, Kristóf Marussy (TU Budapest)</td> +<td>Generation techniques for consistent, realistic, diverse, and scalable graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oszkar-semerath-generation-techniques-for-consistent-realistic-diverse-and-scalable-graphs.pdf">slides</a>, <a href="https://youtu.be/hB6j6mvh-vA">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Molham Aref (RelationalAI)</td> +<td>Graph Normal Form – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/molham-aref-graph-normal-form.pdf">slides</a>, <a href="https://youtu.be/-kP4Raqr5KA">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Naomi Arnold (Queen Mary University of London)</td> +<td>Temporal graph analysis of the far-right social network Gab – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/naomi-arnold-temporal-graph-analysis-of-the-far-right-social-network-gab.pdf">slides</a>, <a href="https://youtu.be/ugSkFlif4PE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:05</td> +<td>Domagoj Vrgoč (PUC Chile)</td> +<td>Evaluating path queries in MillenniumDB – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/domagoj-vrgoc-regular-path-queries-in-millenniumdb.pdf">slides</a>, <a href="https://youtu.be/_OzJ6vI7GNU">video</a></td> +</tr> +<tr> +<td>15:10</td> +<td>15:25</td> +<td>Pavel Klinov, Evren Sirin (Stardog)</td> +<td>Stardog&rsquo;s experience with LDBC – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/evren-sirin-stardog-experience-with-ldbc.pdf">slides</a>, <a href="https://youtu.be/CBrEeOTqGKM">video</a></td> +</tr> +</tbody> +</table> + + + + + Announcing the LDBC Financial Benchmark Task Force + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + Thu, 26 May 2022 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + <p>We are delighted to announce the set up of the <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench) task force</a>.</p> +<p>The Financial Benchmark (FinBench) project aims to define a graph database evaluating benchmark and develop a data generation process and a query driver to make the evaluation of the graph database representative, reliable and comparable, especially in financial scenarios, such as anti-fraud and risk control. The FinBench is scheduled to be released in the end of 2022.</p> +<p>Compared to LDBC SNB, the FinBench will differ in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. FinBench is going to redesign the data pattern and workloads, including the data generation, the query driver, and also some other facilities referred to LDBC SNB.</p> +<p>The FinBench Task Force was approved by LDBC on May 16, 2022. The FinBench Task Force is led by Ant Group, and the initial members also include Pometry, Create Link, StarGraph, Ultipa, Katana, Intel, Memgraph (observer) and Koji Annoura (individual member). See the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">Work Charter for FinBench</a></p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or guozhihui.gzh at antgroup.com.</p> + + + + + Fourteenth TUC Meeting + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + Mon, 16 Aug 2021 16:00:00 +0200 + + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + <p>LDBC was hosting a one-day hybrid workshop, co-located with <a href="https://vldb.org/2021/">VLDB 2021</a> on <strong>August 16 (Monday) between 16:00–20:00 CEST</strong>.</p> +<p>The physical part of the workshop was held in room Akvariet 2 of the <a href="https://www.tivolihotel.com/">Tivoli Hotel</a> (Copenhagen), while the virtual part was hosted on Zoom. Our programme consisted of talks that provide an overview of LDBC&rsquo;s recent efforts. Moreover, we have invited industry practitioners and academic researchers to present their latest results.</p> +<p>Talks were scheduled to be 10 minutes with a short Q&amp;A session. We had three sessions. 
Their schedules are shown below.</p> +<h4 id="16001725-cest-ldbc-updates-benchmarks-query-languages">[16:00–17:25 CEST] LDBC updates, benchmarks, query languages</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>16:00</td> +<td>Peter Boncz (CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a></td> +</tr> +<tr> +<td>16:05</td> +<td>Gábor Szárnyas (CWI)</td> +<td>Overview of LDBC benchmarks – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-benchmarks.pdf">slides</a></td> +</tr> +<tr> +<td>16:12</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>LDBC Social Network Benchmark results with TigerGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mingxi-wu-tigergraph-snb-preliminary-results.pdf">slides</a></td> +</tr> +<tr> +<td>16:24</td> +<td>Xiaowei Zhu (Ant Group)</td> +<td>Financial Benchmark proposal – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/xiaowei-zhu-financial-benchmark.pdf">slides</a></td> +</tr> +<tr> +<td>16:36</td> +<td>Petra Selmer (Neo4j)</td> +<td>Status report from the Existing Languages Working Group (ELWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/petra-selmer-elwg.pdf">slides</a>, <a href="https://youtu.be/I5A8VuFDhsA">video</a></td> +</tr> +<tr> +<td>16:48</td> +<td>Jan Hidders (Birkbeck)</td> +<td>Status report from the Property Graph Schema Working Group (PGSWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/jan-hidders-pgswg.pdf">slides</a>, <a href="https://youtu.be/iEbVi9T-HVk">video</a></td> +</tr> +<tr> +<td>17:00</td> +<td>Keith Hare (JCC Consulting)</td> +<td>Database Language Standards Structure and Process, SQL/PGQ – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/keith-hare-database-language-standards-structure-and-process-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/ZgFCuzods4g">video</a></td> +</tr> +<tr> +<td>17:12</td> +<td>Stefan Plantikow (GQL Editor)</td> +<td>Report on the GQL standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/stefan-plantikow-gql.pdf">slides</a>, <a href="https://youtu.be/z0pN5NwKsgc">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="17351845-cest-systems-and-data-structures">[17:35–18:45 CEST] Systems and data structures</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>17:35</td> +<td>Vasileios Trigonakis (Oracle Labs)</td> +<td>PGX.D aDFS: An Almost Depth-First-Search Distributed Graph-Querying System – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasileios-trigonakis-pgxd-adfs.pdf">slides</a>, <a href="https://youtu.be/cv2ZfWRBOek">video</a></td> +</tr> +<tr> +<td>17:47</td> +<td>Matthias Hauck (SAP)</td> +<td>JSON, Spatial, Graph – Multi-model Workloads with SAP HANA Cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/matthias-hauck-json-spatial-graph-sap-hana-cloud.pdf">slides</a>, <a 
href="https://youtu.be/dgpMJFho6Q8">video</a></td> +</tr> +<tr> +<td>17:59</td> +<td>Nikolay Yakovets (Eindhoven University of Technology)</td> +<td>AvantGraph – <a href="https://youtu.be/z0pN5NwKsgcttachments/nikolay-yakovets-avantgraph.pdf">slides</a>, <a href="https://youtu.be/9M9FOycovTw">video</a></td> +</tr> +<tr> +<td>18:11</td> +<td>Semih Salihoglu (University of Waterloo)</td> +<td>GRainDB: Making RDBMSs Efficient on Graph Workloads Through Predefined Joins – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semih-salihoglu-graindb.pdf">slides</a>, <a href="https://youtu.be/FFK3y6vPHJs">video</a></td> +</tr> +<tr> +<td>18:23</td> +<td>Semyon Grigorev (Saint Petersburg University)</td> +<td>Context-free path querying: Obstacles on the way to adoption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semyon-grigorev-cfpq.pdf">slides</a>, <a href="https://youtu.be/pha1xIpEL3I">video</a></td> +</tr> +<tr> +<td>18:35</td> +<td>Per Fuchs (Technical University of Munich)</td> +<td>Sortledton: A universal, transactional graph data structure – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/per-fuchs-sortledton.pdf">slides</a>, <a href="https://youtu.be/33ZjsNN0hhU">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="1855-2000-cest-high-level-approaches-and-benchmarks">[18:55-20:00 CEST] High-level approaches and benchmarks</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>18:55</td> +<td>Angelos-Christos Anadiotis (Ecole Polytechnique and Institut Polytechnique de Paris)</td> +<td>Empowering Investigative Journalism with Graph-based Heterogeneous Data Management – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/angelos-christos-anadiotis-investigative-journalism-graph-data-management.pdf">slides</a>, <a href="https://youtu.be/a1VYjyec8dg">video</a></td> +</tr> +<tr> +<td>19:07</td> +<td>Vasia Kalavri (Boston University)</td> +<td>Learning to partition unbounded graph streams – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasia-kalavri-learning-to-partition-unbounded-graph-streams.pdf">slides</a>, <a href="https://youtu.be/PTlUABKWniA">video</a></td> +</tr> +<tr> +<td>19:19</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Towards a Hybrid OLTP-OLAP Graph Benchmark – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/muhammad-attahir-jibril-hybrid-oltp-olap-benchmark.pdf">slides</a>, <a href="https://youtu.be/tMBVszTSJXc">video</a></td> +</tr> +<tr> +<td>19:31</td> +<td>Riccardo Tommasini (University of Tartu)</td> +<td>An outlook on Benchmarks for Graph Stream Processing – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/riccardo-tommasini-graph-stream-processing-benchmarks.pdf">slides</a>, <a href="https://youtu.be/HabvJvPXsLc">video</a></td> +</tr> +<tr> +<td>19:43</td> +<td>Mohamed Ragab (University of Tartu)</td> +<td>Benchranking: Towards prescriptive analysis of big graph processing: the case of SparkSQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mohamed-ragab-benchranking.pdf">slides</a>, <a href="https://youtu.be/mZ8LhGUq7Wg">video</a></td> 
+</tr>
+</tbody>
+</table>
+
+      
+      
+        Thirteenth TUC Meeting
+        https://ldbcouncil.org/event/thirteenth-tuc-meeting/
+        Tue, 30 Jun 2020 14:00:00 +0000
+        
+        https://ldbcouncil.org/event/thirteenth-tuc-meeting/
+        <p>LDBC is pleased to announce its Thirteenth Technical User Community (TUC) meeting.</p>
+<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p>
+<p>This TUC meeting will be a two-day event hosted online. We welcome all users of RDF and Graph technologies to attend. If you are interested in attending the event, please contact Gabor Szarnyas (BME) to register.</p>
+<h3 id="snb-task-force">SNB Task Force</h3>
+<ul>
+<li>Progress report
+<ul>
+<li>ACID compliance test suite</li>
+<li>Integrating deletions to Datagen</li>
+<li>Migrating Datagen to Spark</li>
+<li>Redesign of BI read queries</li>
+<li>Extensions to the driver</li>
+</ul>
+</li>
+<li>Ongoing work
+<ul>
+<li>Datagen: tuning the distribution of deletes</li>
+<li>Interactive 2.0 workload</li>
+<li>BI 1.0 workload</li>
+</ul>
+</li>
+</ul>
+<p>Zoom links will be sent through email.</p>
+      
+      
+      
+        Speeding Up LDBC SNB Datagen
+        https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/
+        Fri, 12 Jun 2020 00:00:00 +0000
+        
+        https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/
+        <p>LDBC&rsquo;s <a href="#references">Social Network Benchmark [4]</a> (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework where different graph-based technologies can be fairly tested and compared, one that can drive the identification of systems&rsquo; bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data management.</p>
+<p>LDBC SNB provides <a href="https://github.com/ldbc/ldbc_snb_datagen">Datagen</a> (Data Generator), which produces synthetic datasets mimicking a social network&rsquo;s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism and usability. To address scalability in particular, Datagen has been implemented on the MapReduce computation model to enable scaling out across a distributed cluster. However, since its inception in the early 2010s there has been a tremendous amount of development in the big data landscape, both in the sophistication of distributed processing platforms and in public cloud IaaS offerings. In the light of this, we should reevaluate this implementation and, in particular, investigate whether Apache Spark would be a more cost-effective solution for generating datasets on the scale of tens of terabytes, on public clouds such as Amazon Web Services (AWS).</p>
+<h2 id="overview">Overview</h2>
+<p>The benchmark&rsquo;s specification describes a social network <a href="https://github.com/ldbc/ldbc_snb_docs/blob/9253abbde94ec7eaccd366c5d4c15cca30752e36/figures/schema-comfortable.pdf">data model</a> which divides its components into two broad categories: static and dynamic. The dynamic element consists of an evolving network where people make friends, post in forums, comment or like each other&rsquo;s posts, etc. 
In contrast, the static component contains related attributes, such as countries, universities and organizations, whose values are fixed. For the detailed specifications of the benchmark and the Datagen component, see <a href="#references">References</a>.</p>
+<p>Datasets are generated in a multi-stage process captured as a sequence of MapReduce steps (shown in the diagram below).</p>
+<p><img src="datagen_flow.png" alt=""> \ <em>Figure 1. LDBC SNB Datagen Process on Hadoop</em></p>
+<p>In the initialization phase, dictionaries are populated and distributions are initialized. In the first generation phase, persons are synthesized, then relationships are wired between them along 3 dimensions (university, interest and random). After merging the graph of person relationships, the resulting dataset is output. Following this, activities such as forum posts, comments, likes and photos are generated and output. Finally, the static components are output.</p>
+<p><em>Note: The diagram shows the call sequence as implemented. All steps are sequential &ndash; including the relationship generation &ndash; even in cases when the data dependencies would allow for parallelization.</em></p>
+<p>Entities are generated by procedural Java code and are represented as POJOs in memory and as sequence files on disk. Most entities follow a shallow representation, i.e. foreign keys (in relational terms) are mapped to integer ids, which makes serialization straightforward.<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup> A notable exception is the Knows edge, which contains only the target vertex and is used as a navigation property on the source Person. The target Person is replaced with only the foreign key, augmented with some additional information, in order to keep the structure free of cycles. Needless to say, this <em>edge as property</em> representation makes the data harder to handle in SQL than it would be with a flat join table.</p>
+<p>Entity generation amounts to roughly one fifth of the main codebase. It generates properties drawn from several random distributions using mutable pRNGs. Determinism is achieved by initializing the pRNGs to seeds that are fully defined by the configuration with constants, and otherwise having no external state in the logic.<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup></p>
+<p>Serialization is done by hand-written serializers for the supported output formats (e.g. CSV) and comprises just a bit less than one third of the main codebase. Most of the output is created by directly interacting with low-level HDFS file streams. Ideally, this code should be migrated to higher-level writers that handle faults and give consistent results when the task has to be restarted.</p>
+<h2 id="motivations-for-the-migration">Motivations for the migration</h2>
+<p>The application is written using Hadoop MapReduce, which is now largely superseded by more modern distributed batch processing platforms, notably Apache Spark. For this reason, it was proposed to migrate Datagen to Spark. The migration provides the following benefits:</p>
+<ul>
+<li>
+<p><strong>Better memory utilization:</strong> MapReduce is disk-oriented, i.e. it writes the output to disk after each reduce stage, which is then read by the next MapReduce job. As public clouds provide virtual machines with sufficient RAM to encapsulate any generated dataset, time and money are wasted by the overhead this unnecessary disk I/O incurs. 
Instead, the intermediate results should be cached in memory where possible. The lack of support for this is a well-known limitation of MapReduce.</p> +</li> +<li> +<p><strong>Smaller codebase:</strong> The Hadoop MapReduce library is fairly ceremonial and boilerplatey. Spark provides a higher-level abstraction that is simpler to work with, while still providing enough control on the lower-level details required for this workload.</p> +</li> +<li> +<p><strong>Small entry cost:</strong> Spark and MapReduce are very close conceptually, they both utilise HDFS under the hood, and run on the JVM. This means that a large chunk of the existing code can be reused, and migration to Spark can, therefore, be completed with relatively small effort. Additionally, MapReduce and Spark jobs can be run on AWS EMR using basically the same HW/SW configuration, which facilitates straightforward performance comparisons.</p> +</li> +<li> +<p><strong>Incremental improvements:</strong> Spark exposes multiple APIs for different workloads and operating on different levels of abstraction. Datagen may initially utilise the lower-level, Java-oriented RDDs (which offer the clearest 1 to 1 mapping when coming from MapReduce) and gradually move towards DataFrames to support Parquet output in the serializers and maybe unlock some SQL optimization capabilities in the generators later down the road.</p> +</li> +<li> +<p><strong>OSS, commodity:</strong> Spark is one of the most widely used open-source big data platforms. Every major public cloud provides a managed offering for Spark. Together these mean that the migration increases the approachability and portability of the code.</p> +</li> +</ul> +<h2 id="first-steps">First steps</h2> +<p>The first milestone is a successful run of LDBC Datagen on Spark while making the minimum necessary amount of code alterations. This entails the migration of the Hadoop wrappers around the generators and serializers. The following bullet-points summarize the key notions that cropped up during the process.</p> +<ul> +<li> +<p><strong>Use your memory:</strong> A strong focus was placed on keeping the call sequence intact, so that the migrated code evaluates the same steps in the same order, but with data passed as RDDs. It was hypothesised that the required data could be either cached in memory entirely at all times, or if not, regenerating them would still be faster than involving the disk I/O loop (e.g. by using <code>MEMORY_AND_DISK</code>). In short, the default caching strategy was used everywhere.</p> +</li> +<li> +<p><strong>Regression tests:</strong> Lacking tests apart from an id uniqueness check, meant there were no means to detect bugs introduced by the migration. Designing and implementing a comprehensive test suite was out of scope, so instead, regression testing was utilised, with the MapReduce output as the baseline. The original output mostly consists of Hadoop sequence files which can be read into Spark, allowing comparisons to be drawn with the output from the RDD produced by the migrated code.</p> +</li> +<li> +<p><strong>Thread-safety concerns:</strong> Soon after migrating the first generator and running the regression tests, there were clear discrepancies in the output. These only surfaced when the parallelization level was set greater than 1. This indicated the presence of potential race conditions. 
Thread-safety wasn&rsquo;t a concern in the original implementation due to the fact that MapReduce doesn&rsquo;t use thread-based parallelization for mappers and reducers.<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> In Spark however, tasks are executed by parallel threads in the same JVM application, so the code is required to be thread-safe. After some debugging, a bug was discovered originating from the shared use of java.text.SimpleDateFormat (notoriously known to be not thread-safe) in the serializers. This was resolved simply by changing to java.time.format.DateTimeFormatter. There were multiple instances of some static field on an object being mutated concurrently. In some cases this was a temporary buffer and was easily resolved by making it an instance variable. In another case a shared context variable was used, which was resolved by passing dedicated instances as function arguments. Sadly, the Java language has the same syntax for accessing locals, fields and statics, <sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup> which makes it somewhat harder to find potential unguarded shared variables.</p> +</li> +</ul> +<h2 id="case-study-person-ranking">Case study: Person ranking</h2> +<p>Migrating was rather straightforward, however, the so-called person ranking step required some thought. The goal of this step is to organize persons so that similar ones appear close to each other in a deterministic order. This provides a scalable way to cluster persons according to a similarity metric, as introduced in the <a href="#references">S3G2 paper [3]</a>.</p> +<h3 id="the-original-mapreduce-version">The original MapReduce version</h3> +<p><img src="person_ranking.svg" alt=""> \ <em>Figure 2. Diagram of the MapReduce code for ranking persons</em></p> +<p>The implementation, shown in pseudocode above, works as follows:</p> +<ol> +<li>The equivalence keys are mapped to each person and fed into TotalOrderPartitioner which maintains an order sensitive partitioning while trying to emit more or less equal sized groups to keep the data skew low.</li> +<li>The reducer keys the partitions with its own task id and a counter variable which has been initialized to zero and incremented on each person, establishing a local ranking inside the group. The final state of the counter (which is the total number of persons in that group) is saved to a separate &ldquo;side-channel&rdquo; file upon the completion of a reduce task.</li> +<li>In a consecutive reduce-only stage, the global order is established by reading all of these previously emitted count files in the order of their partition number in each reducer, then creating an ordered map from each partition number to the corresponding cumulative count of persons found in all preceding ones. This is done in the setup phase. In the reduce function, the respective count is incremented and assigned to each person.</li> +</ol> +<p>Once this ranking is done, the whole range is sliced up into equally sized blocks, which are processed independently. For example, when wiring relationships between persons, only those appearing in the same block are considered.</p> +<h3 id="the-migrated-version">The migrated version</h3> +<p>Spark provides a sortBy function which takes care of the first step above in a single line. The gist of the problem remains collecting the partition sizes and making them available in a later step. 
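A rough Scala sketch of this idea is shown below; the names (<code>personsRdd</code>, <code>similarityKey</code>, the Spark context <code>sc</code>) are hypothetical, and the snippet is an illustration of the approach rather than the actual Datagen code.</p>
+<pre><code class="language-scala">// Step 1: sort persons by a similarity key; cache, since the RDD is used by two jobs.
+val sorted = personsRdd.sortBy(p =&gt; similarityKey(p)).cache()
+
+// Collect the size of each partition in a separate job...
+val partitionSizes = sorted
+  .mapPartitionsWithIndex((i, it) =&gt; Iterator((i, it.size)))
+  .collect()
+  .sortBy(_._1)
+  .map(_._2)
+
+// ...turn the sizes into cumulative offsets and share them via a broadcast variable.
+val offsets = sc.broadcast(partitionSizes.scanLeft(0L)(_ + _))
+
+// Each partition adds its offset to a local counter to obtain the global rank.
+val ranked = sorted.mapPartitionsWithIndex { (i, it) =&gt;
+  it.zipWithIndex.map { case (p, localRank) =&gt; (offsets.value(i) + localRank, p) }
+}
+</code></pre>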
+<p>While the MapReduce version uses a side output, in Spark the partition sizes are collected in a separate job and passed into the next phase using a broadcast variable. The resulting code size is a fraction of the original one.</p>
+<h2 id="benchmarks">Benchmarks</h2>
+<p>Benchmarks were carried out on AWS <a href="https://aws.amazon.com/emr/">EMR</a>, originally utilising <a href="https://aws.amazon.com/ec2/instance-types/i3/">i3.xlarge</a> instances because of their fast NVMe SSD storage and ample amount of RAM.</p>
+<p>The application parameter hadoop.numThreads controls the number of reduce threads in each Hadoop job for the MapReduce version and the number of partitions in the serialization jobs in the Spark one. For MapReduce, this was set to n_nodes, i.e. the number of machines; experimentation yielded slowdowns for higher values. The Spark version, on the other hand, performed better with this parameter set to n_nodes * v_cpu. The scale factor (SF) parameter determines the output size. It is defined so that one SF unit generates around 1 GB of data. That is, SF10 generates around 10 GB, SF30 around 30 GB, etc. It should be noted, however, that the output was only around 60% of this in these experiments, for two reasons. One, update stream serialization was not migrated to Spark, due to problems in the original implementation. Of course, for the purpose of faithful comparison the corresponding code was removed from the MapReduce version as well before executing the benchmarks. This explains a 10% reduction from the expected size. The rest can be attributed to incorrectly tuned parameters.<sup id="fnref:5"><a href="#fn:5" class="footnote-ref" role="doc-noteref">5</a></sup> The MapReduce results were as follows:</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * worker/SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10</td>
+<td>1</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>16</td>
+<td>1.60</td>
+</tr>
+<tr>
+<td>30</td>
+<td>1</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>34</td>
+<td>1.13</td>
+</tr>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>40</td>
+<td>1.20</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>44</td>
+<td>1.32</td>
+</tr>
+</tbody>
+</table>
+<p>It can be observed that the runtime per scale factor only increases slowly, which is good. The metric charts show an underutilized, bursty CPU. The bursts are presumably interrupted by the disk I/O phases, when the node is writing the results of a completed job. It can also be seen that the memory only starts to get consumed after 10 minutes of the run have passed.</p>
+<p><img src="mr_sf100_cpu_load.png" alt=""> <br>
+<em>Figure 3. CPU Load for the Map Reduce cluster is bursty and less than<br>
+50% on average (SF100, 2nd graph shows master)</em></p>
+<p><img src="mr_sf100_mem_free.png" alt=""> <br>
+<em>Figure 4. 
The job only starts to consume memory when it is already 10 minutes<br>
+into the run (SF100, 2nd graph shows master)</em></p>
+<p>Let&rsquo;s see how Spark fares.</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * worker/SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10</td>
+<td>1</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>10</td>
+<td>1.00</td>
+</tr>
+<tr>
+<td>30</td>
+<td>1</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>21</td>
+<td>0.70</td>
+</tr>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>27</td>
+<td>0.81</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>36</td>
+<td>1.08</td>
+</tr>
+<tr>
+<td>1000</td>
+<td>30</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>47</td>
+<td>1.41</td>
+</tr>
+<tr>
+<td>3000</td>
+<td>90</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>47</td>
+<td>1.41</td>
+</tr>
+</tbody>
+</table>
+<p>A similar trend can be seen here; however, the run times are around 70% of the MapReduce version. It can be seen that the larger scale factors (SF1000 and SF3000) yielded a longer runtime than expected. On the metric charts of SF100 the CPU shows full utilization, except at the end, when the results are serialized in one go and the CPU is basically idle (the snapshot of the diagram doesn&rsquo;t include this part unfortunately). Spark can be seen to have used up all memory pretty fast even in the case of SF100. In the case of SF1000 and SF3000, the nodes are running so low on memory that most probably some of the RDDs have to be calculated multiple times (no disk-level serialization was used here), which seems to be the most plausible explanation for the slowdowns experienced. In fact, the OOM errors encountered when running SF3000 support this hypothesis even further. It was thus proposed to scale up the RAM in the instances. The CPU utilization hints that adding some extra vCPUs could yield a further speedup.</p>
+<p><img src="spark_sf100_cpu_load.png" alt=""> <br>
+<em>Figure 5. Full CPU utilization for Spark (SF100, last graph shows<br>
+master)</em></p>
+<p><img src="spark_sf100_mem_free.png" alt=""> <br>
+<em>Figure 6. Spark eats up memory fast (SF100, 2nd graph shows master)</em></p>
+<p>i3.2xlarge would have been the most straightforward option for scaling up the instances; however, the humongous 1.9 TB disk of this instance type is completely unnecessary for the job. 
Instead the cheaper r5d.2xlarge instance was utilised, largely identical to i3.2xlarge, except it <em>only</em> has a 300 GB SSD.</p> +<table> +<thead> +<tr> +<th>SF</th> +<th>workers</th> +<th>Platform</th> +<th>Instance Type</th> +<th>runtime (min)</th> +<th>runtime * worker/SF (min)</th> +</tr> +</thead> +<tbody> +<tr> +<td>100</td> +<td>3</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>16</td> +<td>0.48</td> +</tr> +<tr> +<td>300</td> +<td>9</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>21</td> +<td>0.63</td> +</tr> +<tr> +<td>1000</td> +<td>30</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>26</td> +<td>0.78</td> +</tr> +<tr> +<td>3000</td> +<td>90</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>25</td> +<td>0.75</td> +</tr> +<tr> +<td>10000</td> +<td>303</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>25</td> +<td>0.75</td> +</tr> +</tbody> +</table> +<p>The last column clearly demonstrates our ability to keep the cost per scale factor unit constant.</p> +<h2 id="next-steps">Next steps</h2> +<p>The next improvement is refactoring the serializers so they use Spark&rsquo;s high-level writer facilities. The most compelling benefit is that it will make the jobs fault-tolerant, as Spark maintains the integrity of the output files in case the task that writes it fails. This makes Datagen more resilient and opens up the possibility to run on less reliable hardware configuration (e.g. EC2 spot nodes on AWS) for additional cost savings. They will supposedly also yield some speedup on the same cluster configuration.</p> +<p>As already mentioned, the migration of the update stream serialization was ignored due to problems with the original code. Ideally, they should be implemented with the new serializers.</p> +<p>The Spark migration also serves as an important building block for the next generation of LDBC benchmarks. As part of extending the SNB benchmark suite, the SNB task force has recently extended Datagen with support for <a href="#references">generating delete operations [1]</a>. The next step for the task force is to fine-tune the temporal distributions of these deletion operations to ensure that the emerging sequence of events is realistic, i.e. the emerging distribution resembles what a database system would experience when serving a real social network.</p> +<h2 id="acknowledgements">Acknowledgements</h2> +<p>This work is based upon the work of Arnau Prat, Gábor Szárnyas, Ben Steer, Jack Waudby and other LDBC contributors. 
Thanks for your help and feedback!</p> +<h2 id="references">References</h2> +<p>[1] <a href="https://ldbcouncil.org/docs/papers/datagen-deletes-grades-nda-2020.pdf">Supporting Dynamic Graphs and Temporal Entity Deletions in the LDBC Social Network Benchmark&rsquo;s Data Generator</a></p> +<p>[2] <a href="https://www.youtube.com/watch?v=ZQOLuCOOpSI">9th TUC Meeting &ndash; LDBC SNB Datagen Update &ndash; Arnau Prat (UPC)</a> - <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">slides</a></p> +<p>[3] <a href="https://research.vu.nl/en/publications/s3g2-a-scalable-structure-correlated-social-graph-generator">S3G2: a Scalable Structure-correlated Social Graph Generator</a></p> +<p>[4] <a href="https://arxiv.org/abs/2001.02299">The LDBC Social Network Benchmark</a></p> +<p>[5] <a href="https://ldbcouncil.org/">LDBC</a> - <a href="https://github.com/ldbc">LDBC GitHub organization</a></p> +<div class="footnotes" role="doc-endnotes"> +<hr> +<ol> +<li id="fn:1"> +<p>Also makes it easier to map to a tabular format thus it is a SQL friendly representation.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:2"> +<p>It&rsquo;s hard to imagine this done declaratively in SQL.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:3"> +<p>Instead, multiple YARN containers have to be used if you want to parallelize on the same machine.&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:4"> +<p>Although editors usually render these using different font styles.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:5"> +<p>With the addition of deletes, entities often get inserted and deleted during the simulation (which is normal in a social network). During serialization, we check for such entities and omit them. However, we forgot to calculate this when determining the output size, which we will amend when tuning the distributions.&#160;<a href="#fnref:5" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +</ol> +</div> + + + + + Twelfth TUC Meeting + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + Fri, 05 Jul 2019 08:30:00 +0100 + + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + <p>LDBC is pleased to announce its Twelfth Technical User Community (TUC) meeting.</p> +<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event on the last Friday of <strong><a href="https://sigmod2019.org/">SIGMOD/PODS 2019</a></strong> in Amsterdam, The Netherlands, in the conference venue of <strong><a href="http://sigmod2019.org/conf_venue">Beurs van Berlage</a></strong>. The room is the Mendes da Silva kamer. 
Please check its tips for <strong><a href="http://sigmod2019.org/accommodation">accommodation in Amsterdam</a></strong>.</p> +<p>Note also that at SIGMOD/PODS in Amsterdam on Sunday, June 30, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2019">GRADES-NDA 2019</a>, that may be of interest to our audience (this generally holds for the whole SIGMOD/PODS program, of course).</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>You need to be registered in order to get into the SIGMOD/PODS venue. Friday, July 5, is the final, workshop, day of SIGMOD/PODS, and the LDBC TUC meeting joins the other workshops for coffee and lunch.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management.</p> +<p><strong>Talk proposals can be sent to Peter Boncz</strong>, who is also the local organizer. <strong>Please also send your slides to this email for archiving on this site.</strong></p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting, there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The morning slot (08:30-10:30) is reserved for an LDBC Board Meeting, to which in principle only LDBC directors are invited (that meeting will be held in the same room).</p> +<p>The TUC meeting will start on Friday morning after the morning coffee break of SIGMOD/PODS 2019 (<strong>room: Mendes da Silva kamer</strong>):</p> +<p>08:30-10:30 LDBC Board Meeting (non-public)</p> +<p>10:30-11:00 Coffee</p> +<p>11:00-12:45 Session 1: Graph Benchmarks</p> +<ul> +<li> +<p>11:00-11:05 Welcome &amp; introduction</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230404.pdf">11:05-11:45 Gabor Szarnyas (BME), Benjamin Steer (QMUL), Jack Waudby (Newcastle University): Business Intelligence workload: Progress report and roadmap</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706117.pdf">11:45-12:00 Frank McSherry (Materialize): Experiences implementing LDBC queries in a dataflow system</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706118.pdf">12:00-12:25 Vasileios Trigonakis (Oracle): Evaluating a new distributed graph query engine with LDBC: Experiences and limitations</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706130.pdf">12:25-12:45 Ahmed Musaafir (VU Amsterdam): LDBC Graphalytics</a></p> +</li> +</ul> +<p>12:45-14:00 Lunch</p> +<p>14:00-16:05 Session 2: Graph Query Languages</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706120.pdf">14:00-14:25 Juan Sequeda (Capsenta): Property Graph Schema Working Group: A progress report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706121.pdf">14:25-14:50 Stefan Plantikow (Neo4j): GQL: Scope and features</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706122.pdf">report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706119.pdf">14:50-15:15 Vasileios Trigonakis (Oracle): Property graph extensions for the SQL standard</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706129.pdf">15:15-15:40 Alin Deutsch (TigerGraph): Modern graph analytics support in GSQL, TigerGraph&rsquo;s query language</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230401.pdf">15:40-16:05 Jan Posiadała (Nodes and Edges, Poland): Executable semantics of graph query language</a></p> +</li> +</ul> +<p>16:05-16:30 Coffee</p> 
+<p>16:30-17:50 Session 3: Graph System Performance</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111968258.pdf">16:30-16:50 Per Fuchs (CWI): Fast, scalable WCOJ graph-pattern matching on in-memory graphs in Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706124.pdf">16:50-17:10 Semih Salihoglu (University of Waterloo): Optimizing subgraph queries with a mix of tradition and modernity</a> <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706116.pptx">pptx</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706128.pdf">17:10-17:30 Roi Lipman (RedisGraph): Evaluating Cypher queries and procedures as algebraic operations within RedisGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706133.pdf">17:30-17:50 Alexandru Uta (VU Amsterdam): Low-latency Spark queries on updatable data</a></p> +</li> +</ul> +<p>If there is interest, we will organize a social dinner on Friday evening for LDBC attendees.</p> + + + + + Eleventh TUC Meeting + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + Fri, 08 Jun 2018 08:30:00 -0500 + + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + <p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmark development, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event preceding the <a href="https://sigmod2018.org/">SIGMOD/PODS 2018</a> conference in Houston, Texas (not too far away, the whole next week). Note also that at SIGMOD/PODS in Houston on Sunday 10, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2018/">GRADES-NDA 2018</a> as well, so you might combine travel.</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz (<a href="mailto:boncz@cwi.nl">boncz@cwi.nl</a>) and Larri (<a href="mailto:larri@ac.upc.ed">larri@ac.upc.edu</a>). 
Local organizer is Juan Sequeda (<a href="mailto:juanfederico@gmail.com">juanfederico@gmail.com</a>).</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its interactive, business analytics and graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00:</p> +<ul> +<li> +<p>10:30-10:35 Peter Boncz (CWI) - introduction to the LDBC TUC meeting</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090478.pdf">10:35-11:00 Juan Sequeda (Capsenta) - Announcing: gra.fo</a></p> +</li> +<li> +<p>11:00-11:30 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090466.pdf">11:30-11:55 Gabor Szarnyas (BME) - LDBC benchmarks: three aspects of graph processing</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090463.pdf">11:55-12:20 Peter Boncz (CWI) - G-CORE: a composable graph query language by LDBC</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090472.pdf">12:20-12:45 Yinglong Xia (Huawei) - Graph Engine for Cloud AI</a></p> +</li> +<li> +<p>12:45-14:00 lunch</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090474.pdf">14:00-14:25 Stefan Plantikow (Neo4j) - Composable Graph Queries and Multiple Named Graphs in Cypher for Apache Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090481.pdf">14:25-14:50 Oskar van Rest (Oracle) - Analyzing Stack Exchange data using Property Graph in Oracle</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090485.pdf">14:50-15:15 Brad Bebee (Amazon) - Neptune: the AWS graph management service</a></p> +</li> +<li> +<p>15:15-15:40 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99811329.pdf">15:40-16:05 Bryon Jacob (data.world): Broadening the Semantic Web</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99287041.pdf">16:05-16:30 Jason Plurad (IBM) - Graph Computing with JanusGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99745793.pdf">16:30-16:55 Arthur Keen (Cambridge Semantics): AnzoGraph</a></p> +</li> +<li> +<p><a href="http://relational.ai/">16:55-17:20 Molham Aref (relational.ai)</a>) - Introducing.. 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99418113.pdf">relational.ai</a></p> +</li> +<li> +<p>18:00 - 20:00 social dinner in Austin (sponsored by Intel Corp.), Coopers BBQ, 217 Congress Ave, Austin, TX 78701</p> +</li> +</ul> +<h3 id="location">Location</h3> +<p>The TUC will be held at the <a href="https://www.cs.utexas.edu/">University of Texas at Austin, Department of Computer Science</a> in the <a href="https://www.google.com/maps/place/The+University+of+Texas:+Department+of+Computer+Science/@30.2860955,-97.737582,18z/data=!4m5!3m4!1s0x0:0x12edecc8226b3241!8m2!3d30.2862279!4d-97.7365348">Gates Dell Complex (GDC): 2317 Speedway, Austin TX, 78712</a> Room: GDC 6.302</p> +<p>The GDC building has a North and a South building. GDC 6.302 is in the North building. When you enter the main entrance, the North building is on the left and it is served by a pair of elevators. You can take or the elevator to the 6th floor. Exit the elevator on the 6th floor. Turn left, right, left.</p> +<h3 id="from-austin-to-sigmodpods-houston-on-saturday-june-9">From Austin to SIGMOD/PODS (Houston) on Saturday June 9</h3> +<p>Many of the attendees will be going to SIGMOD/PODS which will be held in Houston.</p> +<h4 id="bus">Bus</h4> +<p>One option is to take a <a href="https://us.megabus.com/journey-planner/journeys?days=1&amp;concessionCount=0&amp;departureDate=2018-06-09&amp;destinationId=318&amp;inboundOtherDisabilityCount=0&amp;inboundPcaCount=0&amp;inboundWheelchairSeated=0&amp;nusCount=0&amp;originId=320&amp;otherDisabilityCount=0&amp;pcaCount=0&amp;totalPassengers=1&amp;wheelchairSeated=0">MegaBus that departs from downtown Austin and arrives at downtown Houston</a>.</p> +<p>There is a bus that departs at 12:00PM and arrives at 3:00pm. Cost is $20 (as of April 23).</p> +<p>If you want to spend the day in Austin, there is a bus that departs at 9:55PM and arrives at 12:50am. Cost is $5 (as of April 23).</p> + + + + + Tenth TUC Meeting + https://ldbcouncil.org/event/tenth-tuc-meeting/ + Fri, 01 Sep 2017 10:30:00 +0100 + + https://ldbcouncil.org/event/tenth-tuc-meeting/ + <p>This will be a one-day event at the <a href="http://www.vldb.org/2017">VLDB 2017</a> conference in Munich, Germany on September 1, 2017.</p> +<p>Topics and activities of interest in these TUC meetings are:</p> +<ul> +<li>Presentation on graph data management usage scenarios.</li> +<li>Presentation of the benchmarking results for the different benchmarks, as well as the graph query language task force.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Adrian Diaz (UPC) at <a href="mailto:adiaz@ac.upc.edu">adiaz@ac.upc.edu</a> to register; registration is free, but required.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. 
Talk proposals are handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00</p> +<p>10:30-12:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87588865.pdf">Peter Boncz (CWI): GraphQL task force update - the G-CORE proposal</a> (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868018.pptx">pptx</a>)</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868008.pdf">Gabor Szarnyas (Budapest University of Technology and Economics Hungarian Academy of Sciences): Updates on the Social Network Benchmark BI Workload</a></li> +<li>Alexandru Iosup, Wing Lung Ngai (VU/TU Delft): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868014.pdf">LDBC Graphalytics v0.9</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868013.pdf">Graphalytics Global Competition and Graphalytics Custom Benchmark</a></li> +</ul> +<p>12:00-13:30: lunch break</p> +<p>13:30-15:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868024.pdf">Arnau Prat (UPC): Datasynth: Democratizing property graph generation</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868026.pdf">Marcus Paradies (SAP): SAP HANA GraphScript</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031809.pdf">Yinglong Xia (Huawei): The EYWA Graph Engine in a Cloud AI Platform</a></li> +<li>Gaétan Hains (Huawei): Cost semantics for graph queries</li> +</ul> +<p>15:00-15:30: break</p> +<p>15:30-17:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031812.pdf">Petra Selmer and Stefan Plantikow (Neo4j): openCypher Developments in 2017</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87195650.pdf">Markus Kaindl (Springer): SN SciGraph &ndash; Building a Linked Data Knowledge Graph for the Scholarly Publishing Domain</a></li> +<li>Irini Fundulaki (FORTH): The HOBBIT Link Discovery and Versioning Benchmarks</li> +<li>Ghislain Atemezing (Mondeca): Benchmarking Enterprise RDF stores with Publications Office Dataset</li> +</ul> +<p>Speakers should aim for a <strong>20-minute talk</strong>.</p> +<p>Further:</p> +<ul> +<li>on Friday 
evening (19:00-21:00) there will be a <strong>social dinner</strong> at <a href="https://www.loewenbraeukeller.com/en/pub-and-beer-garden/">Löwenbräukeller</a>, sponsored and arranged by LDBC member Huawei (who have their European Research Center in Munich).</li> +<li>on Friday morning (8:30-10:30) there will be a meeting of the LDBC board of directors, but this meeting is not public.</li> +</ul> +<h3 id="venue">Venue</h3> +<p>The Technical University of Munich (TUM) is hosting that week the <a href="http://www.vldb.org/2017">VLDB conference</a>; on the day of the TUC meeting the main conference will have finished, but there will be a number of co-located workshops ongoing, and the TUC participants will blend in with that crowd for the breaks and lunch.</p> +<p>The TUC meeting will be held in in <strong>Room 2607</strong> alongside the VLDB workshops that day (MATES, ADMS, DMAH, DBPL and BOSS).</p> +<p><strong>address: Technische Universität München (TUM), Arcisstraße 21, 80333 München</strong></p> +<p><a href="https://www.google.nl/maps/place/Technische+Universit%C3%A4t+M%C3%BCnchen/@48.14966,11.5656715,17z/data=!3m1!4b1!4m5!3m4!1s0x479e7261336d8c11:0x79a04d44dc5bf19d!8m2!3d48.14966!4d11.5678602?hl=en">Google Maps</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920002.jpg" alt=""><br> +<img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920003.jpg" alt=""></p> + + + + + Ninth TUC Meeting + https://ldbcouncil.org/event/ninth-tuc-meeting/ + Thu, 09 Feb 2017 15:07:18 -0400 + + https://ldbcouncil.org/event/ninth-tuc-meeting/ + <p>LDBC is pleased to announce its Ninth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> in Walldorf, Germany on February 9+10, 2017.</p> +<p>This will be the third TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>;</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Inalytics and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Thursday morning, with a program from 09:00-18:00, interrupted by a lunch break.</p> +<p>Thursday evening (19:00-21:00) there will be a <strong>social dinner</strong> in Heidelberg.</p> +<p>Friday morning the event resumes from 9:00-12:00. In the afternoon, there is a (closed) LDBC Board of Directors meeting (13:00-16:30) at the same venue.</p> +<h4 id="social-dinner">Social Dinner</h4> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235334.png" alt=""></p> +<p><strong>Address: Hauptstraße 217, 69117 Heidelberg</strong><br> +<strong>Time: 19:00 / 7pm</strong></p> +<p>(See attachments at the bottom of the page)</p> +<h5 id="thursday">Thursday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>Welcome and logistics - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>9:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235329.pdf">Intro + state of the LDBC - Josep Lluis Larriba Pey</a> (UPC)</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235338.pdf">LDBC Graph QL task force</a> - Hannes Voigt (TU Dresden)</td> +</tr> +<tr> +<td>9:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235335.pdf">PGQL Status Update and Comparison to LDBC&rsquo;s Graph QL proposals</a> - Oskar van Rest (Oracle Labs)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628546.pdf">Adding shortest-paths to MonetDB</a> - Dean de Leo (CWI)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431939.pdf">Evolving Cypher for processing multiple graphs</a> - Stefan Plantikow (Neo Technology)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235346.pdf">Standardizing Graph Database Functionality - An Invitation to Collaborate</a> - Jan Michels (ISO/ANSI SQL, Oracle)&quot;</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235343.pdf">Dgraph: Graph database for production environment</a> - Tomasz Zdybal (Dgraph.io)</td> +</tr> +<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431945.pdf">LDBC Graphalytics: Current Capabilities, Upcoming Features, and Long-Term Roadmap</a> - Alexandru Iosup (TU Delft)</td> +</tr> 
+<tr> +<td>13:20</td> +<td>LDBC Graphalytics: Demo of the Live Archive and Competition Features - Tim Hegeman (TU Delft)</td> +</tr> +<tr> +<td>13:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">LDBC SNB Datagen Update</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431943.pdf">LDBC SNB Business Intelligence Workload: Chokepoint Analysis</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431947.pdf">LDBC Benchmark Cost Specification</a> (+discussion) - Moritz Kaufmann (TU Munich)</td> +</tr> +<tr> +<td>14:40</td> +<td>coffee break</td> +</tr> +<tr> +<td>15:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76316673.pdf">EYWA: the Distributed Graph Engine in Huawei MIND Platform</a> (Yinglong Xia)</td> +</tr> +<tr> +<td>15:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431949.pdf">Graph Processing in SAP HANA</a> - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>15:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628563.pdf">Distributed Graph Analytics with Gradoop</a> - Martin Junghanns (Univ Leipzig)</td> +</tr> +<tr> +<td>16:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152834.pdf">Distributed graph flows: Cypher on Flink and Gradoop</a> - Max Kießling (Neo Technology)</td> +</tr> +<tr> +<td>16:30</td> +<td>closing - Peter Boncz</td> +</tr> +<tr> +<td>17:30</td> +<td>end</td> +</tr> +</tbody> +</table> +<h5 id="friday">Friday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>welcome - Peter Boncz</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152833.pdf">Graph processing in obi4wan</a> - Frank Smit (OBI4WAN)</td> +</tr> +<tr> +<td>9:40</td> +<td>Graph problems in the space domain - Albrecht Schmidt (ESA)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75792387.pdf">Medical Ontologies for Healthcare</a> - Michael Neumann (SAP)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76447745.pdf">The Train Benchmark: Cross-Technology Performance Evaluation of Continuous Model Queries</a> - Gabor Szarnyas (BME)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76021761.pdf">Efficient sparse matrix computations and their generalization to graph computing applications</a> - Albert-Jan Yzelman (Huawei)</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152837.pdf">Experiments on Semantic Publishing Benchmark with large scale real news and LOD data at FactForge</a> - Atanas Kyriakov (Ontotext)</td> +</tr> 
+<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td>LDBC Board of Directors Meeting</td> +</tr> +<tr> +<td>17:00</td> +<td>end</td> +</tr> +</tbody> +</table> +<h3 id="logistics">Logistics</h3> +<h5 id="important-things-to-know"><strong>Important things to know</strong></h5> +<p>The following PDF guide provides additional information, such as recommended restaurants as well as sightseeing spots: <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">link</a></p> +<h5 id="venue"><strong>Venue</strong></h5> +<p>The TUC meeting will be held in the <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> at the SAP Guesthouse Kalipeh (<a href="https://www.kalipeh.com">https://www.kalipeh.com</a>). The address is:</p> +<p><strong>WDF 44 / SAP Guesthouse Kalipeh<br> +Dietmar-Hopp-Allee 15<br> +69190 Walldorf<br> +Germany</strong></p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p><a href="https://www.google.com/maps/place/SAP+Guesthouse+Kalipeh/@49.2951903,8.6436224,17z/data=!3m1!4b1!4m5!3m4!1s0x4797bea343a566af:0xd70698f3503ab74b!8m2!3d49.2951868!4d8.6458111">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/69042180.png" alt=""></p> +<h4 id="getting-there"><strong>Getting there</strong></h4> +<h5 id="by-plane"><strong>By plane</strong></h5> +<p>There are two airports close to SAP&rsquo;s headquarter: Frankfurt Airport (FRA) and Stuttgart-Echterdingen Airport (STR). The journey from Frankfurt Airport to SAP headquarters takes about one hour by car, while it takes slightly longer from Stuttgart- Echterdingen Airport. Concerning airfare, flights to Frankfurt are usually somewhat more expensive than to Stuttgart.</p> +<p>When booking flights to Frankfurt, you should be aware of Frankfurt-Hahn Airport (HHN), which serves low-cost carriers but is not connected to Frankfurt Airport. Frankfurt Hahn is approximately one hour from the Frankfurt main airport by car.</p> +<p>The journey from Frankfurt Airport to SAP headquarters takes about one hour by car (95 kilometers, or 59 miles).</p> +<p>Journey time from Stuttgart-Echterdingen Airport to SAP headquarters takes about 1 hour and 15 minutes by car (115 kilometers, or 71 miles).</p> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<p><strong>Traveling from Frankfurt Airport (FRA) to SAP Headquarters:</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A3/Würzburg/A5/Kassel/Basel/Frankfurt.&rdquo;</li> +<li>Follow the A5 to &ldquo;Basel/Karlsruhe/Heidelberg.&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<p>(Should you use a navigational system which does not recognize the street name &lsquo;Dietmar-Hopp-Allee&rsquo; please use &lsquo;Neurottstrasse&rsquo; instead.)</p> +<p><strong>Traveling from Stuttgart-Echterdingen Airport (STR) to SAP Headquarters:</strong></p> +<p>To get to SAP headquarters by car, there are two possible routes to take. The first leads you via Heilbronn and the second via Karlsruhe. 
The route via Karlsruhe is a bit shorter yet may be more congested.</p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A8/Stuttgart/B27.&rdquo;</li> +<li>Stay on A8 and follow the sign for &ldquo;Karlsruhe/Heilbronn/Singen/A8.&rdquo;</li> +<li>Follow A8 to Karlsruhe.</li> +<li>Take exit 41 &ndash; &ldquo;Dreieck Karlsruhe&rdquo; to merge onto A5 toward &ldquo;Frankfurt/Mannheim/Karlsruhe/Landau (Pfalz).&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<h6 id="parking"><strong>Parking</strong></h6> +<p>The closest parking lot to the event location is P7 (see figure above).</p> +<h5 id="by-train"><strong>By Train</strong></h5> +<p>As the infrastructure is very well developed in Europe, and in Germany in particular, taking the train is a great and easy way of traveling. Furthermore, the trains usually run on time, so this mode of travel is very convenient, especially for a group of people on longer journeys to major cities.</p> +<p><strong>From Frankfurt Airport (FRA) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to Terminal 1, level T (see overview in Appendix).</li> +<li>Go to the AIRail Terminal &ndash; &ldquo;Fernbahnhof&rdquo; (long-distance trains).</li> +<li>Choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP.&rdquo; It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> +<p><strong>From Stuttgart-Echterdingen Airport (STR) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to the S-Bahn station in the airport, following the sign (station is called &ldquo;Stuttgart Flughafen/Messe&rdquo;).</li> +<li>Take train number S2 or S3 to &ldquo;Stuttgart Hauptbahnhof&rdquo; (main station).</li> +<li>From Stuttgart Hauptbahnhof choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP&rdquo;. It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> + + + + + LDBC Is Proud to Announce the New LDBC Graphalytics Benchmark Draft Specification + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + Tue, 06 Sep 2016 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + <p>LDBC is proud to announce the new LDBC Graphalytics Benchmark draft specification.</p> +<p>LDBC Graphalytics is the first industry-grade graph data management benchmark for graph analysis platforms such as Giraph. It consists of six core algorithms, standard datasets, synthetic dataset generators, and reference outputs, enabling the objective comparison of graph analysis platforms. 
It has strong industry support from Oracle, Intel, Huawei and IBM, and was tested and optimized on the best industrial and open-source systems.</p>
+<p>Tim Hegeman of <a href="https://www.tudelft.nl">TU Delft</a> is today presenting the technical paper describing LDBC Graphalytics at the important <a href="https://www.vldb.org/conference.html">VLDB</a> (Very Large DataBases) conference in New Delhi, where his talk also marks the release by LDBC of Graphalytics as a benchmark draft. Practitioners are invited to read the PVLDB paper, download the software and try running it.</p>
+<p>LDBC is eager to receive any feedback to guide the future adoption of LDBC Graphalytics.</p>
+<p>Learn more: <a href="/ldbc-graphalytics">LDBC Graphalytics</a></p>
+<p>GitHub: <a href="https://github.com/tudelft-atlarge/graphalytics">https://github.com/tudelft-atlarge/graphalytics</a></p>
+
+
+
+
+ Eighth TUC Meeting
+ https://ldbcouncil.org/event/eighth-tuc-meeting/
+ Wed, 22 Jun 2016 14:45:20 -0400
+
+ https://ldbcouncil.org/event/eighth-tuc-meeting/
+ <p>The LDBC consortium is pleased to announce its Eighth Technical User Community (TUC) meeting.</p>
+<p>This will be a two-day event at the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a> in Redwood Shores on <strong>Wednesday and Thursday June 22-23, 2016</strong>.</p>
+<p>This will be the second TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will cover the following aspects:</p>
+<ul>
+<li>Two-day event with one day devoted to users&rsquo; experiences and one day devoted to benchmarking experiences.</li>
+<li>Presentation of the benchmarking results for the different benchmarks.</li>
+<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li>
+</ul>
+<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify Oracle security in advance, registration requests need to be in by <strong>June 12</strong>.</p>
+<p>In the agenda, there will be talks given by LDBC members about LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and in hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmarks (or benchmark proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p>
+<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of TUC meeting participants and its contacts among graph technology users, but also eventually its membership base.</p>
+<p>On this page, you&rsquo;ll find information about the following items:</p>
+<ul>
+<li><a href="#agenda">Agenda</a></li>
+<li><a href="#logistics">Logistics</a>
+<ul>
+<li><a href="#date">Date</a></li>
+<li><a href="#venue">Venue</a></li>
+<li><a href="#getting-there">Getting there</a></li>
+</ul>
+</li>
+<li><a href="#accommodation">Accommodation</a></li>
+</ul>
+<h3 id="agenda">Agenda</h3>
+<p>On Wednesday, lunch is provided for all attendees at 12 pm. The TUC meeting will start at 1 pm.</p>
+<h6 id="wednesday-22th-of-june-2016-room-203"><strong>Wednesday, 22nd of June 2016 (Room 203)</strong></h6>
+<p>(full morning: LDBC Board of Directors meeting)</p>
+<ul>
+<li>12:00 - 13:00 Lunch (provided)</li>
+<li>13:00 - 13:30 Hassan Chafi (Oracle) and Josep L. Larriba-Pey (Sparsity). Registration and welcome.</li>
+<li>13:30 - 14:00 Peter Boncz (CWI). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133891.pdf">LDBC introduction and status update</a>.</li>
+<li>14:00 - 15:00 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</li>
+<li>14:00 Arnau Prat (DAMA-UPC). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133902.pdf">Social Network Benchmark, Interactive workload</a>.</li>
+<li>14:30 Tim Hegeman (TU Delft). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133893.pdf">Social Network Benchmark, Analytics workload</a>.</li>
+<li>15:00 - 15:30 Coffee break</li>
+<li>15:30 - 17:00 Applications and use of Graph Technologies (chair Hassan Chafi)
+<ul>
+<li>15:30 Martin Zand (University of Rochester Clinical and Translational Science Institute). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133897.pdf">Graphing Healthcare Networks: Data, Analytics, and Use Cases</a>.</li>
+<li>16:00 David Meibusch, Nathan Hawes (Oracle Labs Australia). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133901.pdf">Frappé: Querying and managing evolving code dependency graphs</a>.</li>
+<li>16:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133895.pdf">UniProt: challenges of a public SPARQL endpoint</a>.</li>
+</ul>
+</li>
+<li>17:00 - 18:30 Graph Technologies (chair Peter Boncz)
+<ul>
+<li>17:00 Eugene I. Chong (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133904.pdf">Balancing Act to improve RDF Query Performance in Oracle Database</a>.</li>
+<li>17:30 Lijun Chang (University of New South Wales). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133906.pdf">Efficient Subgraph Matching by Postponing Cartesian Products</a>.</li>
+<li>18:00 Weining Qian (East China Normal University). 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133908.pdf">On Statistical Characteristics of Real-Life Knowledge Graphs</a>.</li> +</ul> +</li> +</ul> +<h6 id="thursday-23th-of-june-2016-room-203"><strong>Thursday, 23th of June 2016 (Room 203)</strong></h6> +<ul> +<li>08:00 - 09:00 Breakfast (provided)</li> +<li>09:00 - 10:00 Details on the progress of LDBC Task Forces 2 (chair Josep L. Larriba-Pey) +<ul> +<li>09:00 Peter Boncz (CWI). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133896.pdf">Query Language Task Force status</a></li> +<li>09:45 Marcus Paradies (SAP). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297729.pdf">Social Network Benchmark, Business Intelligence workload</a></li> +</ul> +</li> +<li>10:00 - 12:00 Graph Technologies and Benchmarking (chair Oskar van Rest) +<ul> +<li>10:00 Sergey Edunov (Facebook). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297731.pdf">Generating realistic trillion-edge graphs</a></li> +<li>10:30 George Fletcher (TU Eindhoven). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297733.pdf">An open source framework for schema-driven graph instance and graph query workload generation</a>.</li> +<li>11:00 Yinglong Xia (Huawei Research America): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297735.pdf">An Efficient Big Graph Analytics Platform</a>.</li> +<li>11:30 Zhe Wu (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297737.pdf">Bridging RDF Graph and Property Graph Data Models</a></li> +</ul> +</li> +<li>12:00 - 13:30 Lunch (provided)</li> +<li>13:30 - 15:30 Graph Technologies (chair Arnau Prat) +<ul> +<li>13:30 Tobias Lindaaker (Neo Technology). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297740.pdf">An open standard for graph queries: the Cypher contribution</a></li> +<li>14:00 Arash Termehchy (Oregon State University). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297742.pdf">Toward Representation Independent Graph Querying &amp; Analytics</a></li> +<li>14:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297745.pdf">In the service of the federation</a></li> +<li>15:00 Nandish Jayaram (Pivotal). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297747.pdf">Orion: Enabling Suggestions in a Visual Query Builder for Ultra-Heterogeneous Graphs</a>.</li> +</ul> +</li> +<li>15:30 - 16:00 Coffee break</li> +<li>16:00 - 17:15 Applications and use of Graph Technologies (chair Hassan Chafi) +<ul> +<li>16:00 Jans Aasman (Franz Inc.). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428806.pdf">Semantic Data Lake for Healthcare</a></li> +<li>16:15 Kevin Madden (Tom Sawyer Software). 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428812.pdf">Dismantling Criminal Networks with Graph and Spatial Visualization and Analysis</a></li> +<li>16:45 Juan Sequeda (Capsenta). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428810.pdf">Using graph representation and semantic technology to virtually integrate and search multiple diverse data sources</a></li> +<li>17:15 Kevin Wilkinson (Hewlett Packard Labs). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428808.pdf">LDBC SNB extensions</a></li> +</ul> +</li> +<li>17:45 - 18:15 Closing discussion</li> +</ul> +<h6 id="friday-24th-of-june-2016-room-105"><strong>Friday, 24th of June 2016 (Room 105)</strong></h6> +<p>At the same venue: the fourth international workshop on Graph Data Management, Experience and Systems (<strong>GRADES16</strong>).</p> +<p>18:30 social dinner for GRADES registrants (place to be announced)</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>22nd and 23rd June 2016</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a></p> +<p>The address is:</p> +<p><strong>Room 203 (Wed-Thu) &amp; Room 105 (Fri)</strong><br> +<strong>Oracle Conference Center</strong><br> +<strong>350 Oracle Parkway</strong><br> +<strong>Redwood City, CA 94065, USA</strong></p> +<p><strong>Maps and situation</strong></p> +<p><a href="https://www.google.com/maps/place/Oracle+Conference+Center/@37.5322827,-122.2667034,17z/data=!3m1!4b1!4m2!3m1!1s0x808f98b5450e8ca3:0xdc75e8b1c02bbb91">Google Maps link</a></p> +<p>Oracle Campus map:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/40927234.jpg" alt=""></p> +<h5 id="getting-there"><strong>Getting there</strong></h5> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<ul> +<li>[Southbound] <strong>-</strong> Take Highway 101 South (toward San Jose) to the Ralston Ave./Marine World Parkway exit. Take Marine World Parkway east which will loop you back over the freeway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +<li>[Northbound] <strong>-</strong> Take Highway 101 North (toward San Francisco) to the Ralston Ave./Marine World Parkway exit. Take the first exit ramp onto Marine World Parkway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +</ul> +<h5 id="parking"><strong>Parking</strong></h5> +<p>The Conference Center has a designated parking lot located directly across from the building. If the lot is filled there is also additional parking in any of the parking garages located near by. No parking permits are needed.</p> +<h5 id="public-transport"><strong>Public transport</strong></h5> +<p>Take the Caltrain to either San Carlos or Hillsdale and take the free Oracle shuttle from there. 
Get off the Oracle shuttle at 100 Oracle Parkway (second stop) and walk 5 minutes to get to the Conference Center.</p>
+<ul>
+<li>Caltrain timetables: <a href="http://www.caltrain.com/schedules/weekdaytimetable.html">http://www.caltrain.com/schedules/weekdaytimetable.html</a></li>
+<li>Oracle Shuttle timetables: <a href="http://www.caltrain.com/schedules/Shuttles/Oracle_Shuttle.html">http://www.caltrain.com/schedules/Shuttles/Oracle_Shuttle.html</a></li>
+</ul>
+<p>You can also take the Caltrain to Belmont and walk 23 minutes, instead of taking the Oracle shuttle.</p>
+<p>Alternatively, SamTrans (San Mateo County&rsquo;s Transit Agency) provides public bus service between the Millbrae BART station and Palo Alto with three stops on Oracle Parkway, one of which is directly in front of the Oracle Conference Center.</p>
+
+
+
+
+ LDBC and Apache Flink
+ https://ldbcouncil.org/post/ldbc-and-apache-flink/
+ Mon, 16 Nov 2015 14:47:00 +0000
+
+ https://ldbcouncil.org/post/ldbc-and-apache-flink/
+ <p>Apache Flink <a href="#references">[1]</a> is an open source platform for distributed stream and batch data processing. Flink&rsquo;s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.</p>
+<p><img src="https://flink.apache.org/img/flink-stack-small.png" alt=""></p>
+<p>Flink offers multiple APIs to process data from various data sources (e.g. HDFS, HBase, Kafka and JDBC). The DataStream and DataSet APIs allow the user to apply general-purpose data operations, like map, reduce, groupBy and join, on streams and static data respectively. In addition, Flink provides libraries for machine learning (Flink ML), graph processing (Gelly) and SQL-like operations (Table). 
All APIs can be used together in a single Flink program, which enables the definition of powerful analytical workflows and the implementation of distributed algorithms.</p>
+<p>The following snippet shows how a wordcount program can be expressed in Flink using the DataSet API:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">&gt;</span> text <span style="color:#f92672">=</span> env<span style="color:#f92672">.</span><span style="color:#a6e22e">fromElements</span><span style="color:#f92672">(</span>
+</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the past controls the future.&#34;</span><span style="color:#f92672">,</span>
+</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the present controls the past.&#34;</span><span style="color:#f92672">);</span>
+</span></span><span style="display:flex;"><span>
+</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>Tuple2<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">,</span> Integer<span style="color:#f92672">&gt;&gt;</span> wordCounts <span style="color:#f92672">=</span> text
+</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">flatMap</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> LineSplitter<span style="color:#f92672">())</span> <span style="color:#75715e">// splits the line and outputs (word,1)
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">.</span><span style="color:#a6e22e">groupBy</span><span style="color:#f92672">(</span><span style="color:#ae81ff">0</span><span style="color:#f92672">)</span> <span style="color:#75715e">// group by word
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">.</span><span style="color:#a6e22e">sum</span><span style="color:#f92672">(</span><span style="color:#ae81ff">1</span><span style="color:#f92672">);</span> <span style="color:#75715e">// sum the 1&#39;s
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>
+</span></span><span style="display:flex;"><span>wordCounts<span style="color:#f92672">.</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span>
+</span></span></code></pre></div><p>At Leipzig University, we use Apache Flink as the execution layer for our graph analytics platform Gradoop <a href="#references">[2]</a>. The LDBC datagen helps us to evaluate the scalability of our algorithms and operators in a distributed execution environment. To use the generated graph data in Flink, we wrote a tool that transforms the LDBC output files into Flink data sets for further processing <a href="#references">[3]</a>. 
Using the class <code>LDBCToFlink</code>, LDBC output files can be read directly from HDFS or from the local file system:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span>
+</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span>
+</span></span><span style="display:flex;"><span>
+</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span>
+</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;hdfs:///ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> <span style="color:#75715e">// or &#34;/path/to/social_network&#34;
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> env<span style="color:#f92672">);</span>
+</span></span><span style="display:flex;"><span>
+</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> vertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">();</span>
+</span></span><span style="display:flex;"><span>
+</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> edges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">();</span>
+</span></span></code></pre></div><p>The tuple classes <code>LDBCVertex</code> and <code>LDBCEdge</code> hold the information generated by the LDBC datagen and are created directly from its output files. During the transformation process, globally unique vertex identifiers are created based on the LDBC identifier and the vertex class. When reading edge files, source and target vertex identifiers are computed in the same way to ensure consistent linking between vertices.</p>
+<p>Each <code>LDBCVertex</code> instance contains:</p>
+<ul>
+<li>an identifier, which is unique among all vertices</li>
+<li>a vertex label (e.g. <code>Person</code>, <code>Comment</code>)</li>
+<li>a key-value map of properties including also multivalued properties (e.g. <code>Person.email</code>)</li>
+</ul>
+<p>Each <code>LDBCEdge</code> instance contains:</p>
+<ul>
+<li>an identifier, which is unique among all edges</li>
+<li>an edge label (e.g. <code>knows</code>, <code>likes</code>)</li>
+<li>a source vertex identifier</li>
+<li>a target vertex identifier</li>
+<li>a key-value map of properties</li>
+</ul>
+<p>The resulting datasets can be used by the DataSet API and all libraries that are built on top of it (i.e. Flink ML, Gelly and Table). In the following example, we load the LDBC graph from HDFS, filter vertices with the label <code>Person</code> and edges with the label <code>knows</code> and use Gelly to compute the connected components of that subgraph. 
The full source code is available on GitHub <a href="#references">[4]</a>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;/home/s1ck/Devel/Java/ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter vertices with label “Person” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> ldbcVertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">VERTEX_CLASS_PERSON</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter edges with label “knows” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> ldbcEdges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">EDGE_CLASS_KNOWS</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly vertices suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> vertices <span style="color:#f92672">=</span> ldbcVertices<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span 
style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly edges suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Edge<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;&gt;</span> edges <span style="color:#f92672">=</span> ldbcEdges<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>Graph<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;</span> g <span style="color:#f92672">=</span> Graph<span style="color:#f92672">.</span><span style="color:#a6e22e">fromDataSet</span><span style="color:#f92672">(</span>vertices<span style="color:#f92672">,</span> edges<span style="color:#f92672">,</span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// run connected components on the subgraph for 10 iterations +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> components <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> g<span style="color:#f92672">.</span><span style="color:#a6e22e">run</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> ConnectedComponents<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// print the component id of the first 10 vertices +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>components<span style="color:#f92672">.</span><span style="color:#a6e22e">first</span><span style="color:#f92672">(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">).</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The ldbc-flink-import tool is available on Github <a href="#references">[3]</a> and licensed under the GNU GPLv3. If you have any questions regarding the tool please feel free to contact me on GitHub. 
If you find bugs or have any ideas for improvements, please create an issue or a pull request.</p> +<p>If you want to learn more about Apache Flink, a good starting point is the main documentation <a href="#references">[5]</a> and if you have any question feel free to ask the official mailing lists.<br> +There is also a nice set of videos <a href="#references">[6]</a> available from the latest Flink Forward conference.</p> +<h4 id="references">References</h4> +<p>[1] <a href="http://flink.apache.org/">http://flink.apache.org/</a></p> +<p>[2] <a href="https://github.com/dbs-leipzig/gradoop">https://github.com/dbs-leipzig/gradoop</a></p> +<p>[3] <a href="https://github.com/s1ck/ldbc-flink-import">https://github.com/s1ck/ldbc-flink-import</a></p> +<p>[4] <a href="https://gist.github.com/s1ck/b33e6a4874c15c35cd16">https://gist.github.com/s1ck/b33e6a4874c15c35cd16</a></p> +<p>[5] <a href="https://ci.apache.org/projects/flink/flink-docs-release-0.10/">https://ci.apache.org/projects/flink/flink-docs-release-0.10/</a></p> +<p>[6] <a href="https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA">https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA</a></p> + + + + + Seventh TUC Meeting + https://ldbcouncil.org/event/seventh-tuc-meeting/ + Mon, 09 Nov 2015 14:17:30 -0400 + + https://ldbcouncil.org/event/seventh-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Seventh Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="http://www.research.ibm.com/labs/watson">IBM&rsquo;s TJ Watson</a> facility on <strong>Monday and Tuesday November 9/10, 2015.</strong></p> +<p>This will be the first TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify IBM security in advance, registration requests need to be in by Nov 1.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<p>In this page, you&rsquo;ll find information about the following items:</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a><br> +- <a href="#date"><strong>Date</strong></a><br> +- <a href="#venue"><strong>Venue</strong></a><br> +- <a href="#maps-and-situation"><strong>Maps and situation</strong></a><br> +- <a href="#getting-there"><strong>Getting there</strong></a></li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>Monday, 9th of November 2015</strong></p> +<p>8:45 - 9:15 Registration and welcome (Yinglong Xia and Josep L. Larriba Pey)</p> +<p>9:15 - 9:30 LDBC introduction and status update (Josep L. Larriba-Pey)</p> +<p>9:30 - 10:30 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</p> +<p>9:30 Arnau Prat (DAMA-UPC). Social Network Benchmark, Interactive workload</p> +<p>10:00 Orri Erling (OpenLink Software). Social Network Benchmark, Business Intelligence workload</p> +<p>10:30-11:00 Coffee break</p> +<p>11:00 - 12:30 Details on the progress of LDBC Task Forces 2 (chair Yinglong Xia)</p> +<p>11:00 Alexandru Iosup (TU Delft). Social Network Benchmark, Analytics workload.</p> +<p>11:30 Claudio Gutierrez (U Chile). Query Language Task Force status.</p> +<p>12:00 Atanas Kiryakov (Ontotext). Semantic Publishing Benchmark status</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 - 16:00 Technologies and benchmarking (chair Hassan Chafi)</p> +<p>14:00 Molham Aref (LogicBlox). Graph Data Management with LogicBlox</p> +<p>14:30 Peter Kogge (Notre Dame). BFS as in Graph500 on today&rsquo;s architectures</p> +<p>15:00 Ching-Yung Lin (IBM). Status and Demo of IBM System G</p> +<p>15:30-16:00 Coffee break</p> +<p>16:00 - 17:00 Technologies (chair Irini Fundulaki)</p> +<p>16:00 Kavitha Srinivas (IBM). SQLGraph: An efficient relational based property graph store</p> +<p>16:30 David Ediger (GeorgiaTech). STINGER</p> +<p>17:00 Gary King (Franz Inc.). AllegroGraph&rsquo;s SPARQL implementation with Social Network Analytics abilities using Magic Properties</p> +<p>17:30 Manoj Kumar (IBM). Linear Algebra Formulation for Large Graph Analytics</p> +<p>18:00 Reihaneh Amini (Wright State University) Linked Data in the GeoLink Usecase</p> +<p>19:00 Social dinner</p> +<p><strong>Tuesday 10th November 2015</strong></p> +<p>9:00 - 10:30 Technology, Applications and Benchmarking (chair Alexandru Iosup)</p> +<p>9:00 Philip Rathle (Neo). On openCypher</p> +<p>9:20 Morteza Shahriari (University of Florida). Multi-modal Probabilistic Knowledge Base for Remote Sensing Species Identification</p> +<p>9:50 Peter Kogge (Notre Dame). Challenging problems with Lexis Nexis Risk Solutions</p> +<p>10:10 Arnau Prat (DAMA-UPC). DATAGEN, status and perspectives for synthetic data generation</p> +<p>10:30 - 11:00 Coffee break</p> +<p>11:00 - 12:45 Applications and use of Graph Technologies (chair Atanas Kiryakov)</p> +<p>11:00 Hassan Chafi (Oracle). Status and characteristics of PGQL</p> +<p>11:20 David Guedalia (TAGIIO). Multi-tier distributed mobile applications and how they split their workload,</p> +<p>11:40 Guojing Cong (IBM). Algorithmic technique and architectural support for fast graph analysis</p> +<p>12:00 Josep Lluis Larriba-Pey. 
Conclusions for the TUC meeting and future perspectives</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>9th and 10th November 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the IBM Thomas J Watson Research Center.<br> +The address is:</p> +<p><strong>IBM Thomas J Watson Research Center</strong><br> +<strong>1101 Kitchawan Rd,</strong><br> +<strong>Yorktown Heights, NY 10598, USA</strong></p> +<p>If you are using a <em>GPS system</em>, please enter <strong>&ldquo;200 Aqueduct Road, Ossining NY, 10562&rdquo;</strong> for accurate directions to the lab entrance. You may also want to check the routing online.</p> +<p>The meeting will take place in the <em>Auditorium</em> on November 9th, and in Meeting Room <em>20-043</em> on November 10th.</p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p>You are highly suggested to <strong>rent a car</strong> for your convenience, since the public transportation system does not cover this area very well. Besides, there is no hotel within walkable distance to the IBM T.J. Watson Research Center. Feel free to find carpool with other attendees. You may find car rental and hotels through <a href="http://www.orbitz.com">www.orbitz.com</a>, or <a href="http://www.expedia.com">www.expedia.com</a> Feel free to email <a href="mailto:yxia@us.ibm.com">yxia@us.ibm.com</a> for any questions.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/seventh-tuc-meeting/attachments/6882333/15926330.png" alt=""></p> +<h6 id="getting-there"><strong>Getting there</strong></h6> +<p><strong>Upper and Eastern New England</strong></p> +<p>Route I-84 west to Route I-684, south to Exit 6, west on Route 35 to Route 100, south to Route 134, west 2.5 miles. IBM is on the left.</p> +<p><strong>New Haven and Connecticut Shores</strong></p> +<p>Merritt Parkway or New England Thruway (Route I-95) west to Route I-287, west to Exit 3, north on Sprain Brook Parkway, which merges into Taconic State Parkway, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New Jersey</strong></p> +<p>Take New York State Thruway (Route I-87) east across the Tappan Zee Bridge and follow signs to the Saw Mill Parkway north. Proceed north on Saw Mill River Parkway to Taconic State Parkway exit, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>Upstate New York</strong></p> +<p>Route I-84 east across Newburgh-Beacon Bridge to Exit 16-S. Taconic State Parkway south to Route 134 East exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New York City (Manhattan)</strong></p> +<p>Henry Hudson Parkway north, which becomes Saw Mill River Parkway, north to Taconic State Parkway exit. North on Taconic State Parkway to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>John F. Kennedy International Airport</strong></p> +<p>North on Van Wyck Expressway to the Whitestone Expressway and continue north across the Bronx-Whitestone Bridge to the Hutchinson River Parkway north to the Cross County Parkway exit and proceed west to the Bronx River Parkway. 
North on the Bronx River Parkway to the Sprain Brook Parkway, which merges into the Taconic State Parkway. Continue north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>LaGuardia Airport</strong></p> +<p>East on the Grand Central Parkway, north on the Whitestone Expressway, and continue north across the Bronx-Whitestone Bridge. Continue with instructions from John F. Kennedy International Airport, above.</p> +<p><strong>Newark International Airport</strong></p> +<p>North on the New Jersey Turnpike (Route I-95). Stay in local lanes and take Exit 72 for Palisades Interstate Parkway. North on the Palisades Interstate Parkway to the New York State Thruway, Route I-87, and east across the Tappan Zee Bridge. Continue with instructions from New Jersey, above.</p> +<p><strong>Stewart International Airport</strong></p> +<p>Route 207 east to Route I-84, east across Newburgh-Beacon Bridge to Taconic State Parkway, south. Continue with instructions from Upstate New York, above.</p> +<p><strong>Westchester County Airport</strong></p> +<p>Right on Route 120, north. Turn left where Route 120 merges with Route 133. Continue on Route 120. Cross Route 100 and continue straight on Shingle House Road to Pines Bridge Road. Turn right and proceed several hundred yards. IBM is on the left.</p> +<p><strong>Public Transportation</strong></p> +<p>Metropolitan Transportation Authority (MTA) train stations nearest to the Yorktown Heights location are the Croton-Harmon and White Plains stations. Taxi service is available at both locations.</p> + + + + + Elements of Instance Matching Benchmarks: a Short Overview + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + Tue, 16 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + <p>The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not explicitly stated but is discovered using <strong>instance matching</strong> techniques and tools. Instance matching is also known as <strong>record linkage</strong> <a href="#references">[1]</a>, <strong>duplicate detection</strong> <a href="#references">[2]</a>, <strong>entity resolution</strong> <a href="#references">[3]</a> and <strong>object identification</strong> <a href="#references">[4]</a>.</p> +<p>For instance, a search in Geonames (<a href="http://www.geonames.org/">http://www.geonames.org/</a>) for &ldquo;Athens&rdquo; would return a resource (i.e., URI) accompanied with a map of the area and information about the place; additional information for the city of Athens can be found in other datasets such as for instance DBpedia (<a href="http://dbpedia.org/">http://dbpedia.org/</a>) or Open Government Datasets (<a href="http://data.gov.gr/">http://data.gov.gr/</a>). 
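+Such &ldquo;same-as&rdquo; links are exactly what an instance matching tool has to produce. As a minimal illustrative sketch (using Apache Jena, which is our own assumption rather than anything prescribed in this post, and with an illustrative GeoNames URI), the identity of the two descriptions of Athens could be stated as follows:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java">import org.apache.jena.rdf.model.Model;
+import org.apache.jena.rdf.model.ModelFactory;
+import org.apache.jena.rdf.model.Resource;
+import org.apache.jena.vocabulary.OWL;
+
+// Minimal sketch: record that two URIs describe the same real-world city.
+// Apache Jena and the GeoNames URI below are illustrative assumptions.
+public class SameAsExample {
+  public static void main(String[] args) {
+    Model model = ModelFactory.createDefaultModel();
+    Resource geonamesAthens = model.createResource("http://sws.geonames.org/264371/");
+    Resource dbpediaAthens = model.createResource("http://dbpedia.org/resource/Athens");
+    // state the identity link and print the resulting graph in Turtle
+    model.add(geonamesAthens, OWL.sameAs, dbpediaAthens);
+    model.write(System.out, "TURTLE");
+  }
+}
+</code></pre></div>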
<p>To obtain all the necessary information about the city of Athens, we need to establish that the retrieved resources refer to the same real world object.</p>
+<p>Web resources are published by &ldquo;autonomous agents&rdquo; who choose their preferred information representation or the one that best fits the application of interest. Furthermore, different representations of the same real world entity are due to data acquisition errors or different acquisition techniques used to process scientific data. Moreover, real world entities evolve and change over time, and sources need to keep track of these developments, a task that is very hard and often not possible. Finally, when integrating data from multiple sources, the process itself may add new erroneous data. Clearly, these reasons are not limited to problems that arose in the era of Web Data; it is thus not surprising that instance matching systems have been around for several years <a href="#references">[2]</a><a href="#references">[5]</a>.</p>
+<p>It is, however, essential at this point to develop, along with instance and entity matching systems, <em>instance matching benchmarks to determine the weak and strong points of those systems, as well as their overall quality in order to support users in deciding the system to use for their needs</em>. Hence, well-defined, good-quality benchmarks are important for comparing the performance of available or under-development instance matching systems. Benchmarks are used not only to inform users of the strengths and weaknesses of systems, but also to motivate developers, researchers and technology vendors to deal with the weak points of their systems and to ameliorate their performance and functionality. They are also useful for identifying the settings in which each of the systems has optimal performance. Benchmarking aims at providing an objective basis for such assessments.</p>
+<p>An instance matching benchmark for Linked Data consists of a <em>source</em> and <em>target dataset</em> implementing a set of <em>test cases</em>, where each test case addresses a different kind of requirement regarding instance matching, a <em>ground truth</em> or <em>gold standard</em>, and finally the <em>evaluation metrics</em> used to <em>assess the benchmark</em>.</p>
+<p>Datasets are the raw material of a benchmark. A benchmark comprises a <em>source</em> and a <em>target</em> dataset, and the objective of an instance matching system is to discover the matches between the two. Datasets are characterized by (a) their <em>nature</em> (<em>real</em> or <em>synthetic</em>), (b) the <em>schemas/ontologies</em> they use, (c) their <em>domains</em>, (d) the <em>languages</em> they are written in, and (e) the <em>variations/heterogeneities</em> of the datasets. Real datasets are widely used in benchmarks since they offer realistic conditions for heterogeneity problems and they have realistic distributions. <em>Synthetic datasets</em> are generated using automated data generators and are useful because they offer fully controlled test conditions, have accurate gold standards and allow setting the focus on specific types of heterogeneity problems in a systematic manner.</p>
+<p>Datasets (and benchmarks) may contain different <em>kinds of variations</em> that correspond to <em>different test cases</em>. According to Ferrara et al. 
<a href="#references">[6]</a><a href="#references">[7]</a>, three kinds of variations exist for Linked Data, namely <em>data variations</em>, <em>structural variations</em> and <em>logical variations</em>. The first refers mainly to differences due to typographical errors, differences in the employed data formats, language etc. The second refers to the differences in the structure of the employed Linked Data schemas. Finally, the third type derives from the use of semantically rich RDF and OWL constructs that enable one to define hierarchies and equivalence of classes and properties, (in)equality of instances, complex class definitions through union and intersection among others.</p> +<p>The common case in real benchmarks is that the datasets to be matched contain different kinds (combinations) of variations. On the other hand, synthetic datasets may be purposefully designed to contain specific types (or combinations) of variations (e.g., only structural), or may be more general in an effort to illustrate all the common cases of discrepancies that appear in reality between individual descriptions.</p> +<p>The <em>gold standard</em> is considered as the “correct answer sheet” of the benchmark, and is used to judge the completeness and soundness of the result sets of the benchmarked systems. For instance matching benchmarks employing synthetic datasets, the gold standard is always automatically generated, as the errors (variations) that are added into the datasets are known and systematically created. When it comes to real datasets, the gold standard can be either manually curated or (semi-) automatically generated. In the first case, domain experts manually mark the matches between the datasets, whereas in the second, supervised and crowdsourcing techniques aid the process of finding the matches, a process that is often time consuming and error prone.</p> +<p>Last, an instance matching benchmark uses <em>evaluation metrics</em> to determine and assess the systems’ output quality and performance. For instance matching tools, performance is not a critical aspect. On the other hand, an instance matching tool should return all and only the correct answers. So, what matters most is returning the relevant matches, rather than returning them quickly. For this reason, the evaluation metrics that are dominantly employed for instance matching benchmarks are the standard <em>precision</em>, <em>recall</em> and <em>f-measure</em> metrics.</p> +<h4 id="references">References</h4> +<p>[1] Li, C., Jin, L., and Mehrotra, S. (2006) Supporting efficient record linkage for large data sets using mapping techniques. WWW 2006.</p> +<p>[2] Dragisic, Z., Eckert, K., Euzenat, J., Faria, D., Ferrara, A., Granada, R., Ivanova, V., Jimenez-Ruiz, E., Oskar Kempf, A., Lambrix, P., Montanelli, S., Paulheim, H., Ritze, D., Shvaiko, P., Solimando, A., Trojahn, C., Zamaza, O., and Cuenca Grau, B. (2014) Results of the Ontology Alignment Evaluation Initiative 2014. Proc. 9th ISWC workshop on ontology matching (OM 2014).</p> +<p>[3] Bhattacharya, I. and Getoor, L. (2006) Entity resolution in graphs. Mining Graph Data. Wiley and Sons 2006.</p> +<p>[4] Noessner, J., Niepert, M., Meilicke, C., and Stuckenschmidt, H. (2010) Leveraging Terminological Structure for Object Reconciliation. In ESWC 2010.</p> +<p>[5] Flouris, G., Manakanatas, D., Kondylakis, H., Plexousakis, D., Antoniou, G. 
Ontology Change: Classification and Survey (2008) Knowledge Engineering Review (KER 2008), pages 117-152.</p> +<p>[6] Ferrara, A., Lorusso, D., Montanelli, S., and Varese, G. (2008) Towards a Benchmark for Instance Matching. Proc. 3th ISWC workshop on ontology matching (OM 2008).</p> +<p>[7] Ferrara, A., Montanelli, S., Noessner, J., and Stuckenschmidt, H. (2011) Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p> + + + + + SNB Interactive Part 3: Choke Points and Initial Run on Virtuoso + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + Wed, 10 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + <p>In this post we will look at running the <a href="https://ldbcouncil.org/developer/snb">LDBC SNB</a> on <a href="https://virtuoso.openlinksw.com/">Virtuoso</a>.</p> +<p>First, let&rsquo;s recap what the benchmark is about:</p> +<ol> +<li> +<p>fairly frequent short updates, with no update contention worth mentioning</p> +</li> +<li> +<p>short random lookups</p> +</li> +<li> +<p>medium complex queries centered around a person&rsquo;s social environment</p> +</li> +</ol> +<p>The updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an online social application does lookups for the most part. The medium complex queries are to challenge the DBMS.</p> +<p>The DBMS challenges have to do firstly with query optimization, and secondly with execution with a lot of non-local random access patterns. Query optimization is not a requirement, <em>per se,</em> since imperative implementations are allowed, but we will see that these are no more free of the laws of nature than the declarative ones.</p> +<p>The workload is arbitrarily parallel, so intra-query parallelization is not particularly useful, if also not harmful. There are latency constraints on operations which strongly encourage implementations to stay within a predictable time envelope regardless of specific query parameters. The parameters are a combination of person and date range, and sometimes tags or countries. The hardest queries have the potential to access all content created by people within 2 steps of a central person, so possibly thousands of people, times 2000 posts per person, times up to 4 tags per post. We are talking in the millions of key lookups, aiming for sub-second single-threaded execution.</p> +<p>The test system is the same as used in the <a href="http://www.openlinksw.com/weblog/oerling/?id=1739">TPC-H series</a>: dual Xeon E5-2630, 2x6 cores x 2 threads, 2.3GHz, 192 GB RAM. The software is the <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics branch</a> of <a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack, available from www.github.com</a>.</p> +<p>The dataset is the SNB 300G set, with:</p> +<table> +<thead> +<tr> +<th>1,136,127</th> +<th>persons</th> +</tr> +</thead> +<tbody> +<tr> +<td>125,249,604</td> +<td>knows edges</td> +</tr> +<tr> +<td>847,886,644</td> +<td>posts, including replies</td> +</tr> +<tr> +<td>1,145,893,841</td> +<td>tags of posts or replies</td> +</tr> +<tr> +<td>1,140,226,235</td> +<td>likes of posts or replies</td> +</tr> +</tbody> +</table> +<p>As an initial step, we run the benchmark as fast as it will go. 
We use 32 threads on the driver side for 24 hardware threads.</p> +<p>Below are the numerical quantities for a 400K operation run after 150K operations worth of warmup.</p> +<p><strong>Duration:</strong> 10:41.251<br> +<strong>Throughput:</strong> 623.71 (op/s)</p> +<p>The statistics that matter are detailed below, with operations ranked in order of descending client-side wait-time. All times are in milliseconds.</p> +<table> +<thead> +<tr> +<th>% of total</th> +<th>total_wait</th> +<th>name</th> +<th>count</th> +<th>mean</th> +<th>min</th> +<th>max</th> +</tr> +</thead> +<tbody> +<tr> +<td>20%</td> +<td>4,231,130</td> +<td>LdbcQuery5</td> +<td>656</td> +<td>6,449.89</td> +<td>245</td> +<td>10,311</td> +</tr> +<tr> +<td>11%</td> +<td>2,272,954</td> +<td>LdbcQuery8</td> +<td>18,354</td> +<td>123.84</td> +<td>14</td> +<td>2,240</td> +</tr> +<tr> +<td>10%</td> +<td>2,200,718</td> +<td>LdbcQuery3</td> +<td>388</td> +<td>5,671.95</td> +<td>468</td> +<td>17,368</td> +</tr> +<tr> +<td>7.3%</td> +<td>1,561,382</td> +<td>LdbcQuery14</td> +<td>1,124</td> +<td>1,389.13</td> +<td>4</td> +<td>5,724</td> +</tr> +<tr> +<td>6.7%</td> +<td>1,441,575</td> +<td>LdbcQuery12</td> +<td>1,252</td> +<td>1,151.42</td> +<td>15</td> +<td>3,273</td> +</tr> +<tr> +<td>6.5%</td> +<td>1,396,932</td> +<td>LdbcQuery10</td> +<td>1,252</td> +<td>1,115.76</td> +<td>13</td> +<td>4,743</td> +</tr> +<tr> +<td>5%</td> +<td>1,064,457</td> +<td>LdbcShortQuery3PersonFriends</td> +<td>46,285</td> +<td>22.9979</td> +<td>0</td> +<td>2,287</td> +</tr> +<tr> +<td>4.9%</td> +<td>1,047,536</td> +<td>LdbcShortQuery2PersonPosts</td> +<td>46,285</td> +<td>22.6323</td> +<td>0</td> +<td>2,156</td> +</tr> +<tr> +<td>4.1%</td> +<td>885,102</td> +<td>LdbcQuery6</td> +<td>1,721</td> +<td>514.295</td> +<td>8</td> +<td>5,227</td> +</tr> +<tr> +<td>3.3%</td> +<td>707,901</td> +<td>LdbcQuery1</td> +<td>2,117</td> +<td>334.389</td> +<td>28</td> +<td>3,467</td> +</tr> +<tr> +<td>2.4%</td> +<td>521,738</td> +<td>LdbcQuery4</td> +<td>1,530</td> +<td>341.005</td> +<td>49</td> +<td>2,774</td> +</tr> +<tr> +<td>2.1%</td> +<td>440,197</td> +<td>LdbcShortQuery4MessageContent</td> +<td>46,302</td> +<td>9.50708</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.9%</td> +<td>407,450</td> +<td>LdbcUpdate5AddForumMembership</td> +<td>14,338</td> +<td>28.4175</td> +<td>0</td> +<td>2,008</td> +</tr> +<tr> +<td>1.9%</td> +<td>405,243</td> +<td>LdbcShortQuery7MessageReplies</td> +<td>46,302</td> +<td>8.75217</td> +<td>0</td> +<td>2,112</td> +</tr> +<tr> +<td>1.9%</td> +<td>404,002</td> +<td>LdbcShortQuery6MessageForum</td> +<td>46,302</td> +<td>8.72537</td> +<td>0</td> +<td>1,968</td> +</tr> +<tr> +<td>1.8%</td> +<td>387,044</td> +<td>LdbcUpdate3AddCommentLike</td> +<td>12,659</td> +<td>30.5746</td> +<td>0</td> +<td>2,060</td> +</tr> +<tr> +<td>1.7%</td> +<td>361,290</td> +<td>LdbcShortQuery1PersonProfile</td> +<td>46,285</td> +<td>7.80577</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.6%</td> +<td>334,409</td> +<td>LdbcShortQuery5MessageCreator</td> +<td>46,302</td> +<td>7.22234</td> +<td>0</td> +<td>2,055</td> +</tr> +<tr> +<td>1%</td> +<td>220,740</td> +<td>LdbcQuery2</td> +<td>1,488</td> +<td>148.347</td> +<td>2</td> +<td>2,504</td> +</tr> +<tr> +<td>0.96%</td> +<td>205,910</td> +<td>LdbcQuery7</td> +<td>1,721</td> +<td>119.646</td> +<td>11</td> +<td>2,295</td> +</tr> +<tr> +<td>0.93%</td> +<td>198,971</td> +<td>LdbcUpdate2AddPostLike</td> +<td>5,974</td> +<td>33.3062</td> +<td>0</td> +<td>1,987</td> +</tr> +<tr> +<td>0.88%</td> +<td>189,871</td> 
+<td>LdbcQuery11</td> +<td>2,294</td> +<td>82.7685</td> +<td>4</td> +<td>2,219</td> +</tr> +<tr> +<td>0.85%</td> +<td>182,964</td> +<td>LdbcQuery13</td> +<td>2,898</td> +<td>63.1346</td> +<td>1</td> +<td>2,201</td> +</tr> +<tr> +<td>0.74%</td> +<td>158,188</td> +<td>LdbcQuery9</td> +<td>78</td> +<td>2,028.05</td> +<td>1,108</td> +<td>4,183</td> +</tr> +<tr> +<td>0.67%</td> +<td>143,457</td> +<td>LdbcUpdate7AddComment</td> +<td>3,986</td> +<td>35.9902</td> +<td>1</td> +<td>1,912</td> +</tr> +<tr> +<td>0.26%</td> +<td>54,947</td> +<td>LdbcUpdate8AddFriendship</td> +<td>571</td> +<td>96.2294</td> +<td>1</td> +<td>988</td> +</tr> +<tr> +<td>0.2%</td> +<td>43,451</td> +<td>LdbcUpdate6AddPost</td> +<td>1,386</td> +<td>31.3499</td> +<td>1</td> +<td>2,060</td> +</tr> +<tr> +<td>0.01%</td> +<td>1,848</td> +<td>LdbcUpdate4AddForum</td> +<td>103</td> +<td>17.9417</td> +<td>1</td> +<td>65</td> +</tr> +<tr> +<td>0.00%</td> +<td>44</td> +<td>LdbcUpdate1AddPerson</td> +<td>2</td> +<td>22</td> +<td>10</td> +<td>34</td> +</tr> +</tbody> +</table> +<p>At this point we have in-depth knowledge of the choke points the benchmark stresses, and we can give a first assessment of whether the design meets its objectives for setting an agenda for the coming years of graph database development.</p> +<p>The implementation is well optimized in general but still has maybe 30% room for improvement. We note that this is based on a compressed column store. One could think that alternative data representations, like in-memory graphs of structs and pointers between them, are better for the task. This is not necessarily so; at the least, a compressed column store is much more space efficient. Space efficiency is the root of cost efficiency, since as soon as the working set is not in memory, a random access workload is badly hit.</p> +<p>The set of choke points (technical challenges) actually revealed by the benchmark is so far as follows:</p> +<ul> +<li> +<p><em>Cardinality estimation under heavy data skew —</em> Many queries take a tag or a country as a parameter. The cardinalities associated with tags vary from 29M posts for the most common to 1 for the least common. Q6 has a common tag (in top few hundred) half the time and a random, most often very infrequent, one the rest of the time. A declarative implementation must recognize the cardinality implications from the literal and plan accordingly. An imperative one would have to count. Missing this makes Q6 take about 40% of the time instead of 4.1% when adapting.</p> +</li> +<li> +<p><em>Covering indices —</em> Being able to make multi-column indices that duplicate some columns from the table often saves an entire table lookup. For example, an index onpost by author can also contain the post&rsquo;s creation date.</p> +</li> +<li> +<p><em>Multi-hop graph traversal —</em> Most queries access a two-hop environment starting at a person. Two queries look for shortest paths of unbounded length. For the two-hop case, it makes almost no difference whether this is done as a union or a special graph traversal operator. For shortest paths, this simply must be built into the engine; doing this client-side incurs prohibitive overheads. A bidirectional shortest path operation is a requirement for the benchmark.</p> +</li> +<li> +<p><em>Top <em>K</em> —</em> Most queries returning posts order results by descending date. Once there are at least <em>k</em> results, anything older than the __k__th can be dropped, adding a dateselection as early as possible in the query. 
This interacts with vectored execution, so that starting with a short vector size more rapidly produces an initial top <em>k</em>.</p> +</li> +<li> +<p><em>Late projection —</em> Many queries access several columns and touch millions of rows but only return a few. The columns that are not used in sorting or selection can be retrieved only for the rows that are actually returned. This is especially useful with a column store, as this removes many large columns (e.g., text of a post) from the working set.</p> +</li> +<li> +<p><em>Materialization —</em> Q14 accesses an expensive-to-compute edge weight, the number of post-reply pairs between two people. Keeping this precomputed drops Q14 from the top place. Other materialization would be possible, for example Q2 (top 20 posts by friends), but since Q2 is just 1% of the load, there is no need. One could of course argue that this should be 20x more frequent, in which case there could be a point to this.</p> +</li> +<li> +<p><em>Concurrency control —</em> Read-write contention is rare, as updates are randomly spread over the database. However, some pages get read very frequently, e.g., some middle level index pages in the post table. Keeping a count of reading threads requires a mutex, and there is significant contention on this. Since the hot set can be one page, adding more mutexes does not always help. However, hash partitioning the index into many independent trees (as in the case of a cluster) helps for this. There is also contention on a mutex for assigning threads to client requests, as there are large numbers of short operations.</p> +</li> +</ul> +<p>In subsequent posts, we will look at specific queries, what they in fact do, and what their theoretical performance limits would be. In this way we will have a precise understanding of which way SNB can steer the graph DB community.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + SNB and Graphs Related Presentations at GRADES '15 + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + Fri, 29 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + <p>Next 31st of May the GRADES workshop will take place in Melbourne within the ACM/SIGMOD presentation. GRADES started as an initiative of the Linked Data Benchmark Council in the SIGMOD/PODS 2013 held in New York.</p> +<p>Among the papers published in this edition we have &ldquo;Graphalytics: A Big Data Benchmark for Graph-Processing Platforms&rdquo;, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can be found in <a href="https://github.com/ldbc">https://github.com/ldbc</a>) as the base to execute the algorithms used for the benchmark, among which we have BFS, community detection and connected components. We also have &ldquo;Microblogging Queries on Graph Databases: an Introspection&rdquo; which benchmarks two of the most significant Graph Databases in the market, i.e. 
Neo4j and Sparksee using microblogging queries on top of twitter data. We can finally mention &ldquo;Frappé: Querying the Linux Kernel Dependency Graph&rdquo; which presents a framework for querying and visualising the dependencies of large C/C++ software systems.</p> +<p><a href="http://event.cwi.nl/grades2015/program.shtml">Check the complete agenda.</a></p> +<p>Meet you in Melbourne!</p> + + + + + SNB Interactive Part 2: Modeling Choices + https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/ + Tue, 26 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/ + <p><a href="https://ldbcouncil.org/benchmarks/snb">​SNB Interactive</a> is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.</p> +<p>In the case of <a href="http://dbpedia.org/resource/Virtuoso_Universal_Server">Virtuoso</a>, we have played with <a href="http://dbpedia.org/resource/SQL">SQL</a> and <a href="http://dbpedia.org/resource/SPARQL">SPARQL</a> implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that this allows to materialize multi-part indices and data orderings that make sense for the application. In other words, there is transparency into physical design. An RDF application may also have physical design by means ofstructure-aware storage but this is more complex and here we are just concerned with speed and having things work precisely as we intend.</p> +<h3 id="schema-design">Schema Design</h3> +<p>SNB has a regular schema described by a <a href="https://en.wikipedia.org/wiki/Unified_Modeling_Language">UML</a> diagram. This has a number of relationships of which some have attributes. There are no heterogenous sets, e.g. no need for run-time typed attributes or graph edges with the same label but heterogeneous end points. Translation into SQL or RDF is straightforward. Edges with attributes, e.g. the knows relation between people would end up represented as a subject with the end points and the date since as properties. The relational implementation has a two-part primary key and the date since as a dependent column. A native property graph database would use an edge with an extra property for this, as such are typically supported.</p> +<p>The only table-level choice has to do with whether <code>posts</code> and <code>comments</code> are kept in the same or different data structures. The Virtuoso schema has a single table for both, with nullable columns for the properties that occur only in one. This makes the queries more concise. There are cases where only non-reply posts of a given author are accessed. This is supported by having two author foreign key columns each with its own index. There is a single nullable foreign key from the reply to the post/comment being replied to.</p> +<p>The workload has some frequent access paths that need to be supported by index. Some queries reward placing extra columns in indices. For example, a common pattern is accessing the most recent posts of an author or group of authors. 
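+</p>
+<p>As a toy illustration of this access path, the following Python sketch keeps a hypothetical in-memory index ordered by creator and creation date (the data and names are invented; this is not the Virtuoso schema or code). The newest posts of one author can then be read off a contiguous slice of the index, without touching the base table.</p>
+<pre><code class="language-python">import bisect
+
+# Hypothetical covering index: tuples ordered by (creator_id, creation_date, post_id).
+# All values are invented for illustration.
+post_index = [
+    (101, 20120301, 7), (101, 20120517, 9), (101, 20120601, 12),
+    (202, 20120410, 3), (202, 20120902, 18),
+]
+
+def newest_posts(creator_id, k):
+    """Return up to k newest (creation_date, post_id) pairs for one creator,
+    reading only the contiguous index slice that belongs to that creator."""
+    lo = bisect.bisect_left(post_index, (creator_id,))
+    hi = bisect.bisect_left(post_index, (creator_id + 1,))
+    rows = post_index[lo:hi]              # already ordered by creation_date
+    return [(date, post) for (_, date, post) in reversed(rows)][:k]
+
+print(newest_posts(101, 2))   # the two most recent posts of creator 101
+</code></pre>
+<p>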
There, having a composite key <code>of ps_creatorid</code>, <code>ps_creationdate</code>, <code>ps_postid</code> pays off since the top-k on <code>creationdate</code> can be pushed down into the index without needing a reference to the table.</p> +<p>The implementation is free to choose data types for attributes, specifically datetimes. The Virtuoso implementation adopts the practice of the <a href="http://dbpedia.org/resource/DEX_(Graph_database)">Sparksee</a> and <a href="http://dbpedia.org/resource/Neo4j">Neo4J</a> implementations and represents this is a count of milliseconds since epoch. This is less confusing, faster to compare and more compact than a native datetime datatype that may or may not have timezones etc. Using a built-in datetime seems to be nearly always a bad idea. A dimension table or a number for a time dimension avoids the ambiguities of a calendar or at least makes these explicit.</p> +<p>The benchmark allows procedurally maintaining materializations of intermediate results for use by queries as long as these are maintained transaction by transaction. For example, each person could have the 20 newest posts by immediate contacts precomputed. This would reduce Q2 &ldquo;top of the wall&rdquo; to a single lookup. This dows not however appear to be worthwhile. The Virtuoso implementation does do one such materialization for Q14: A connection weight is calculated for every pair of persons that know each other. This is related to the count of replies by one or the other to content generated by the other. If there does not exist a single reply in either direction, the weight is taken to be 0. This weight is precomputed after bulk load and subsequently maintained each time a reply is added. The table for this is the only row-wise structure in the schema and represents a half matrix of connected people, i.e. <code>person1</code>, <code>person2</code> -&gt; <code>weight</code>. <code>Person1</code> is by convention the one with the smaller <code>p_personid</code>. Note that comparing id&rsquo;s in this way is useful but not normally supported by RDF systems. RDF would end up comparing strings of URI&rsquo;s with disastrous performance implications unless an implementation specific trick were used.</p> +<p>In the next installment we will analyze an actual run.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference + https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/ + Mon, 25 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/ + <p>LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015. 
The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.</p> +<p>On the industry track, LDBC will be presenting the <em>Social Network Benchmark Interactive Workload</em> by Orri Erling (OpenLink Software), Alex Averbuch (Neo Technology), Josep Larriba-Pey (Sparsity Technologies), Hassan Chafi (Oracle Labs), Andrey Gubichev (TU Munich), Arnau Prat (Universitat Politècnica de Catalunya), Minh-Duc Pham (VU University Amsterdam) and Peter Boncz (CWI).</p> +<p>You can read more about the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark here</a> and collaborate if you&rsquo;re interested!</p> +<p>The other presentation will be at the GRADES workshop within the SIGMOD program regarding <em>Graphalytics: A Big Data Benchmark for Graph-Processing platforms</em> by Mihai Capotă, Tim Hegeman, Alexandru Iosup (Delft University of Technology), Arnau Prat (Universitat Politècnica de Catalunya), Orri Erling (OpenLink Sotware) and Peter Boncz (CWI). We will provide more information about GRADES and this specific presentation in a following post as GRADES is part of the events organized by LDBC.</p> +<p>Don&rsquo;t forget to check our presentations if you&rsquo;re attending the SIGMOD!</p> + + + + + SNB Interactive Part 1: What Is SNB Interactive Really About? + https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/ + Thu, 14 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/ + <p>This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. This is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of same.</p> +<p>With two implementations of SNB interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its performance characteristics are understood and even if these do not represent the maximum of the attainable, there are no glaring mistakes and the implementation represents a reasonable best effort by those who ought to know, namely the system vendors.</p> +<p>The essence of a benchmark is a set of trick questions or choke points, as LDBC calls them. A number of these were planned from the start. It is then the role of experience to tell whether addressing these is really the key to winning the race. Unforeseen ones will also surface.</p> +<p>So far, we see that SNB confronts the implementor with choices in the following areas:</p> +<ul> +<li>Data model: Relational, RF, property graph?</li> +<li>Physical model, e.g. row-wise vs. column wise storage</li> +<li>Materialized data ordering: Sorted projections, composite keys, replicating columns in auxxiliary data structures</li> +<li>Maintaining precomputed, materialized intermediate results, e.g. use of materialized views, triggers</li> +<li>Query optimization: join order/type, interesting physical data orderings, late projection, top k, etc.</li> +<li>Parameters vs. 
literals: Sometimes different parameter values result in different optimal query plans</li> +<li>Predictable, uniform latency: The measurement rules stipulate the SUT must not fall behind the simulated workload</li> +<li>Durability - how to make data durable while maintaining steady throughput? Logging vs. checkpointing.</li> +</ul> +<p>In the process of making a benchmark implementation, one naturally encounters questions about the validity, reasonability and rationale of the benchmark definition itself. Additionally, even though the benchmark might not directly measure certain aspects of a system, making an implementation will take a system past its usual envelope and highlight some operational aspects.</p> +<ul> +<li>Data generation - Generating a mid-size dataset takes time, e.g. 8 hours for 300G. In a cloud situation, keeping the dataset in S3 or similar is necessary, re-generating every time is not an option.</li> +<li>Query mix - Are the relative frequencies of the operations reasonable? What bias does this introduce?</li> +<li>Uniformity of parameters: Due to non-uniform data distributions in the dataset, there is easily a 100x difference between a &lsquo;fast&rsquo; and &lsquo;slow&rsquo; case of a single query template. How long does one need to run to balance these fluctuations?</li> +<li>Working set: Experience shows that there is a large difference between almost warm and steady state of working set. This can be a factor of 1.5 in throughput.</li> +<li>Are the latency constraints reasonable? In the present case, a qualifying run must have under 5% of all query executions starting over 1 second late. Each execution is scheduled beforehand and done at the intended time. If the SUT does not keep up, it will have all available threads busy and must finish some work before accepting new work, so some queries will start late. Is this a good criterion for measuring consistency of response time? There are some obvious possibilities of abuse.</li> +<li>Is the benchmark easy to implement/run? Perfection is open-ended and optimization possibilities infinite, albeit with diminishing returns. Still, getting startyed should not be too hard. Since systems will be highly diverse, testing that these in fact do the same thing is important. The SNB validation suite is good for this and given publicly available reference implementations, the effort of getting started is not unreasonable.</li> +<li>Since a Qualifying run must meet latency constraints while going as fast as possible, setting the performance target involves trial and error. Does the tooling make this easy?</li> +<li>Is the durability rule reasonable? Right now, one is not required to do checkpoints but must report the time to roll forward from the last checkpoint or initial state. Incenting vendors to build faster recovery is certainly good, but we are not through with all the implications. 
What about redundant clusters?</li> +</ul> +<p>The following posts will look at the above in light of actual experience.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + Why Do We Need an LDBC SNB-Specific Workload Driver? + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + Tue, 21 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + <p>In a previous <a href="https://ldbcouncil.org/tags/driver">3-part blog series</a> we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn&rsquo;t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more traditional database benchmark workloads. Additionally, it will motivate why we chose to develop a new workload driver as part of this work, rather than using existing tooling that was developed in other database benchmarking efforts. To briefly recap, the task of the driver is to run a transactional database benchmark against large synthetic graph datasets - &ldquo;graph&rdquo; is the word that best captures the novelty and difficulty of this work.</p> +<p><strong>Workload Execution - Traditional vs Graph</strong></p> +<p>Transactional graph workloads differ from traditional relational workloads in several fundamental ways, one of them being the complex dependencies that exist between queries of a graph workload.</p> +<p>To understand what is meant by &ldquo;traditional relational workloads&rdquo;, take the classical TPC-C benchmark as an example. In TPC-C Remote Terminal Emulators (emulators) are used to issue update transactions in parallel, where the transactions issued by these emulators do not depend on one another. Note, &ldquo;dependency&rdquo; is used here in the context of scheduling, i.e., one query is dependent on another if it can not start until the other completes. For example, a New-Order transaction does not depend on other orders from this or other users. Naturally, the results of Stock-Level transactions depend on the items that were previously sold, but in TPC-C it is not an emulator&rsquo;s responsibility to enforce any such ordering. The scheduling strategy employed by TPC-C is tailored to the scenario where transactional updates do not depend on one another. In reality, one would expect to also have scheduling dependencies between transactions, e.g., checking the status of the order should only be done after the order is registered in the system. TPC-C, however, does not do this and instead only asks for the status of the last order <em>for a given user</em>. Furthermore, adding such dependencies to TPC-C would make scheduling only slightly more elaborate. 
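+</p>
+<p>As a rough sketch of why such partition-local ordering stays cheap, consider the following illustrative Python (hypothetical operation names, not code from any TPC-C kit or from the LDBC driver): each emulator owns a disjoint set of users, so a simple per-user queue enforces the ordering without any coordination between emulators.</p>
+<pre><code class="language-python">from collections import defaultdict, deque
+
+# Hypothetical operation log, keyed by the user each operation belongs to.
+# A status check may only run after the order it refers to has been submitted.
+operations = [
+    ("alice", "new_order", "o1"),
+    ("bob",   "new_order", "o2"),
+    ("alice", "order_status", "o1"),
+    ("bob",   "order_status", "o2"),
+]
+
+# Each emulator owns a disjoint set of users, so the ordering is purely local.
+queues = defaultdict(deque)
+for user, kind, order_id in operations:
+    queues[user].append((kind, order_id))
+
+def run_user(user):
+    """Drain one user's queue in order; a submitted order gates its status checks."""
+    submitted = set()
+    for kind, order_id in queues[user]:
+        if kind == "new_order":
+            submitted.add(order_id)
+        if kind == "order_status":
+            assert order_id in submitted, "dependency violated"
+        print(user, kind, order_id)
+
+for user in queues:    # emulators could run these loops in parallel, one user set each
+    run_user(user)
+</code></pre>
+<p>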
Indeed, the Load Tester (LT) would need to make sure a New-Order transaction always precedes the read requests that check its status, but because users (and their orders) are partitioned across LTs, and orders belong to a particular user, this scheduling does not require inter-LT communication.</p> +<p>A significantly more difficult scheduling problem arises when we consider the SNB benchmark that models a real-world social network. Its domain includes users that form a social friendship graph and which leave posts/comments/likes on each others walls (forums). The update transactions are generated (exported as a log) by the data generator, with assigned timestamps, e.g. user 123 added post 456 to forum 789 at time T. Suppose we partition this workload by user, such that each driver gets all the updates (friendship requests, posts, comments and likes on other user&rsquo;s posts etc) initiated by a given user. Now, if the benchmark is to resemble a real-world social network, the update operations represent a highly connected (and dependent) network: a user should not create comments before she joins the network, a friendship request can not be sent to a non-existent user, a comment can only be added to a post that already exists, etc. Given a user partitioning scheme, most such dependencies would cross the boundaries between driver threads/processes, because the correct execution of update operations requires that the social network is in a particular state, and that state depends on the progress of other threads/processes.</p> +<p>Such scheduling dependencies in the SNB workload essentially replicate the underlying graph-like shape of its dataset. That is, every time a user comments on a friend&rsquo;s wall, for example, there is a dependency between two operations that is captured by an edge of the social graph. <em>Partitioning the workload among the LTs therefore becomes equivalent to graph partitioning, a known hard problem.</em></p> +<p><strong>Because it&rsquo;s a graph</strong></p> +<p>In short, unlike previous database benchmarking efforts, the SNB workload has necessitated a redefining of the state-of-the-art in workload execution. It is no longer sufficient to rely solely on workload partitioning to safely capture inter-query dependencies in complex database benchmark workloads. The graph-centric nature of SNB introduces new challenges, and novel mechanisms had to be developed to overcome these challenges. To the best of our knowledge, the LDBC SNB Interactive benchmark is the first benchmark that requires a non-trivial partitioning of the workload, among the benchmark drivers. In the context of workload execution, our contribution is therefore the principled design of a driver that executes dependent update operations in a performant and scalable way, across parallel/distributed LTs, while providing repeatable, vendor-independent execution of the benchmark.</p> + + + + + Event Driven Post Generation in Datagen + https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/ + Fri, 10 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/ + <p>As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain more in depth how this is actually implemented inside of the generator.</p> +<p>First of all, I start with a few basics of how Datagen works internally. 
In Datagen, once the person graph has been created (persons and their relationships), the activity generation starts. Persons are divided into blocks of 10k, in the same way they are during friendship edges generation process. Then, for each person of the block, three types of forums are created:</p> +<ul> +<li> +<p>The wall of the person</p> +</li> +<li> +<p>The albums of the person</p> +</li> +<li> +<p>The groups where the person is a moderator</p> +</li> +</ul> +<p>We will put our attention to group generation, but the same concepts apply to the other types of forums. Once a group is created, the members of the group are selected. These are selected from either the friends of the moderator, or random persons within the same block.</p> +<p>After assigning the members to the group, the post generation starts. We have two types of post generators, the uniform post generator and the event based post generator. Each post generator is responsible of, given a forum, generate a set of posts for the forum, whose authors are taken from the set of members of the forum. The uniform post generator distributes the dates of the generated posts uniformly in the time line (from the date of the membership until the end of the simulation time). On the other hand, the event based post generator assigns dates to posts, based on what we call “flashmob events”.</p> +<p>Flashmob events are generated at the beginning of the execution. Their number is predefined by a configuration parameter which is set to 30 events per month of simulation, and the time of the event is distributed uniformly along all the time line. Also, each event has a volume level assigned (between 1 and 20) following a power law distribution, which determines how relevant or important the event is, and a tag representing the concept or topic of the event. Two different events can have the same tag. For example, one of the flashmob events created for SF1 is one related to &ldquo;Enrique Iglesias&rdquo; tag, whose level is 11 and occurs on 29th of May of 2012 at 09:33:47.</p> +<p>Once the event based post generation starts for a given group, a subset of the generated flashmob events is extracted. These events must be correlated with the tag/topic of the group, and the set of selected events is restricted by the creation date of the group (in a group one cannot talk about an event previous to the creation of the group). Given this subset of events and their volume level, a cumulative probability distribution (using the events sorted by event date and their level) is computed, which is later used to determine to which event a given post is associated. Therefore, those events with a larger lavel will have a larger probability to receive posts, making their volume larger. Then, post generation starts, which can be summarized as follows:</p> +<ul> +<li> +<p>Determine the number of posts to generate</p> +</li> +<li> +<p>Select a random member of the group that will generate the post</p> +</li> +<li> +<p>Determine the event the post will be related to given the aforementioned cumulative distribution</p> +</li> +<li> +<p>Assign the date of the post based on the event date</p> +</li> +</ul> +<p>In order to assign the date to the post, based on the date of the event the post is assigned to, we follow the following probability density, which has been extracted from <a href="#references">[1]</a>. 
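+</p>
+<p>Before looking at that density, here is a minimal sketch of the event-selection step from the list above (illustrative Python with made-up event times and levels; the actual Datagen implementation differs in its details): events are weighted by their volume level, so higher-level events attract proportionally more posts.</p>
+<pre><code class="language-python">import bisect
+import random
+
+# Hypothetical flashmob events for one group: (event_time, volume_level).
+# In Datagen the levels follow a power law; these values are made up.
+events = [("2012-03-01 10:00", 2), ("2012-05-29 09:33", 11), ("2012-08-14 18:20", 4)]
+
+# Cumulative distribution weighted by level, so higher-level events
+# attract proportionally more posts.
+total = sum(level for _, level in events)
+cumulative = []
+running = 0.0
+for _, level in events:
+    running += level / total
+    cumulative.append(running)
+
+def pick_event():
+    """Draw one event according to the level-weighted cumulative distribution."""
+    r = random.random()
+    i = bisect.bisect_left(cumulative, r)
+    return events[min(i, len(events) - 1)]   # guard against rounding at the top end
+
+random.seed(42)
+print([pick_event()[0] for _ in range(5)])   # event times five posts would cluster around
+</code></pre>
+<p>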
The shape of the probability density consists of a combination of an exponential function in the 8 hour interval around the peak, while the volume outside this interval follows a logarithmic function. The following figure shows the actual shape of the volume, centered at the date of the event.</p> +<p><img src="index.png" alt=""></p> +<p>Following the example of &ldquo;Enrique Iglesias&rdquo;, the following figure shows the activity volume of posts around the event as generated by Datagen.</p> +<p><img src="index2.png" alt=""></p> +<p>In this blog entry we have seen how datagen creates event driven user activity. This allows us to reproduce the heterogenous post creation density found in a real social network, where post creation is driven by real world events.</p> +<h4 id="references">References</h4> +<p>[1] Jure Leskovec, Lars Backstrom, Jon M. Kleinberg: Meme-tracking and the dynamics of the news cycle. KDD 2009: 497-506</p> + + + + + Sixth TUC Meeting + https://ldbcouncil.org/event/sixth-tuc-meeting/ + Thu, 19 Mar 2015 13:53:33 -0400 + + https://ldbcouncil.org/event/sixth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce its Sixth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at Universitat Politècnica de Catalunya, Barcelona on <strong>Thursday and Friday March 19/20, 2015.</strong></p> +<p>The LDBC FP7 EC funded project is reaching its finalisation, and this will be the last event sponsored directly by the project. However, tasks within LDBC will continue based on the LDBC independent organisation. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the first benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the whole new LDBC organisation officials.</li> +<li>Pre-event with the 3rd Graph-TA workshop organised on March 18th at the same premises, with a lot of interaction and interesting research presentations.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>.</p> +<h3 id="agenda">Agenda</h3> +<p><strong>Thursday 19th March</strong></p> +<p>11:00 - 11:30 Registration, coffee break and welcome (Josep Larriba Pey)</p> +<p>11:30 - 12:00 LDBC introduction and status update (Peter Boncz) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981131.pdf">slides</a></p> +<p>12:00 - 13:30 Technology and benchmarking (chair: Peter Boncz)</p> +<p>12:00 Venelin Kotsev (Ontotext). Semantic Publishing Benchmark v2.0. – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981137.pdf">slides</a></p> +<p>12:30 Nina Saveta (FORTH). SPIMBENCH: A Scalable, Schema-Aware, Instance Matching Benchmark for the Semantic Publishing Domain</p> +<p>12:50 Tomer Sagi (HP). 
Titan DB on LDBC SNB Interactive</p> +<p>13:10 Claudio Martella (VUA): Giraph and Lighthouse</p> +<p>13:30 - 14:30 Lunch break</p> +<p>14:30 - 16:00 Applications and use of Graph Technologies (chair: Hassan Chafi)</p> +<p>14:30 Jerven Bolleman (Swiss Institute of Bioinformatics): 20 billion triples in production <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981132.pdf">slides</a></p> +<p>14:50 Mark Wilkinson (Universidad Politécnica de Madrid): Design principles for Linked-Data-native Semantic Web Services <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981133.pdf">slides</a></p> +<p>15:10 Peter Haase (Metaphacts, Systap LLC): Querying the Wikidata Knowledge Graph <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981139.pdf">slides</a></p> +<p>15:30 Esteban Sota (GNOSS): Human Interaction with Faceted Searching Systems for big or complex graphs</p> +<p>18:30 - 20:00 Cultural visit Barcelona city center. Meet at Plaça Catalunya.</p> +<p>20:00 Social dinner at <a href="http://www.bastaix.com">Bastaix Restaurant</a>.</p> +<p><strong>Friday 20th March</strong></p> +<p>9:30 - 11:00 Technology and Benchmarking (chair: Josep L. Larriba-Pey)</p> +<p>9:30 Yinglong Xia (IBM): Towards Temporal Graph Management and Analytics</p> +<p>9:50 Alexandru Iosup (TU Delft). Graphalytics: A big data benchmark for graph-processing platforms</p> +<p>10:10 John Snelson (MarkLogic): Introduction to MarkLogic</p> +<p>10:30 Arnau Prat (UPC-Sparsity Technologies) and Alex Averbuch (Neo): Social Network Benchmark, Interactive Workload</p> +<p>10:50 Moritz Kaufmann. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/moritz-kaufmann-ldbc-snb-benchmark-auditing-6th-ldbc-tuc.pdf">The auditing experience</a></p> +<p>11:15 - 11:45 Coffee break</p> +<p>11:45 - 12:45 Applications and use of Graph Technologies (chair: Atanas Kiryakov)</p> +<p>11:45 Boris Motik (Oxford University): Parallel and Incremental Materialisation of RDF/Datalog in RDFox</p> +<p>12:05 Andreas Both (Unister): E-Commerce and Graph-driven Applications: Experiences and Optimizations while moving to Linked Data</p> +<p>12:25 Smrati Gupta (CA Technologies). Modaclouds Decision Support System in multicloud environments</p> +<p>12:45 Peter Boncz. Conclusions for the LDBC project and future perspectives. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981138.pdf">slides</a></p> +<p>13:30 - 14:30 Lunch break</p> +<p>15:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>19th and 20th March 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held at &ldquo;Aula Master&rdquo; at A3 building located inside the &ldquo;Campus Nord UPC&rdquo; in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h5 id="maps-and-situation"><strong>Maps and situation</strong></h5> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<h5 id="finding-upc"><strong>Finding UPC</strong></h5> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<h5 id="finding-the-meeting-room"><strong>Finding the meeting room</strong></h5> +<h5 id="getting-there">Getting there</h5> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to<br> +the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €20 and trips to other destinations in the city cost approximately €25-30.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. 
You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<h5 id="the-locations-of-the-airport-and-the-city-centre"><strong>The locations of the airport and the city centre</strong></h5> + + + + + The LDBC Datagen Community Structure + https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/ + Sun, 15 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/ + <p>This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.</p> +<p>When generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other more qualitative characteristics such as the degree distribution, clustering coefficient. Real graphs, and specially social networks, have typically highly skewed degree distributions with a long tail, a moderatelly large clustering coefficient and an appreciable community structure.</p> +<p>The first two characteristics are deliberately modeled in DATAGEN. DATAGEN generates persons with a degree distribution that matches that observed in Facebook, and thanks to the attribute correlated edge generation process, we obtain graphs with a moderately large clustering coefficient. But what about the community structure of graphs generated with DATAGEN? The answer can be found in the paper titled “How community-like is the structure of synthetically generated graphs”, which was published in GRADES 2014 <a href="#references">[1]</a>. Here we summarize the paper and its contributions and findings.</p> +<p>Existing synthetic graph generators such as Rmat <a href="#references">[1]</a> and Mag <a href="#references">[2]</a>, are graphs generators designed to produce graphs with long tailed distributions and large clustering coefficient, but completely ignore the fact that real graphs are structured into communities. For this reason, Lancichinetti et al. proposed LFR <a href="#references">[3]</a>, a graph generator that did not only produced graphs with realistic high level characteristics, but enforced an appreciable community structure. This generator, has become the de facto standard for benchmarking community detection algorithms, as it does not only outputs a graph but also the communities present in that graph, hence it can be used to test the quality of a community detection algorithm.</p> +<p>However, no one studied if the community structure produced by LFR, was in fact realistic compared to real graphs. Even though the community structure in LFR exhibit interesting properties, such as the expected larger internal density than external, or a longtailed distribution of community sizes, they lack the noise and inhomogeneities present in a real graph. And more importantly, how does the community structure of DATAGEN compares to that exhibited in LFR and reap graphs? Is it more or less realistic? The authors of <a href="#references">[1]</a> set up an experiment where they analized the characteristics of the communities output by LFR, and the groups (groups of people interested in a given topic) output by DATAGEN, and compared them to a set of real graphs with metadata. 
These real graphs, which can be downloaded from the Snap project website, are graphs that have recently become very popular in the field of community detection, as they contain ground truth communities extracted from their metadata. The ground truth graphs used in this experiment are shown in the following table. For more details about how this ground truth is generated, please refer to <a href="#references">[4]</a>.</p>
+<table>
+<thead>
+<tr>
+<th></th>
+<th><em>Nodes</em></th>
+<th><em>Edges</em></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><em>Amazon</em></td>
+<td>334863</td>
+<td>925872</td>
+</tr>
+<tr>
+<td><em>Dblp</em></td>
+<td>317080</td>
+<td>1049866</td>
+</tr>
+<tr>
+<td><em>Youtube</em></td>
+<td>1134890</td>
+<td>2987624</td>
+</tr>
+<tr>
+<td><em>Livejournal</em></td>
+<td>3997962</td>
+<td>34681189</td>
+</tr>
+</tbody>
+</table>
+<p>The authors of <a href="#references">[1]</a> selected a set of statistical indicators to characterize the communities:</p>
+<ul>
+<li>The clustering coefficient</li>
+<li>The triangle participation ratio (TPR), which is the ratio of nodes that close at least one triangle in the community.</li>
+<li>The bridge ratio, which is the ratio of edges whose removal disconnects the community.</li>
+<li>The diameter</li>
+<li>The conductance</li>
+<li>The size</li>
+</ul>
+<p>The authors start by analyzing each community of the ground truth graphs using the above statistical indicators and plotting the distributions of each of them. The following are the plots of the Livejournal graph. We summarize the findings of the authors regarding real graphs:</p>
+<ul>
+<li>Several indicators (clustering coefficient, TPR and bridge ratio) exhibit a multimodal distribution, with two peaks at their extremes.</li>
+<li>Many of the communities (44%) have a small clustering coefficient between 0 and 0.01. Out of them, 56% have just three vertices. On the other hand, 11% of the communities have a clustering coefficient between 0.99 and 1.0. In between, communities exhibit different values of clustering coefficients. This trend is also observed for TPR and bridge ratio. This suggests that communities cannot be modeled using a single model.</li>
+<li>84% of the communities have a diameter smaller than five, suggesting that ground truth communities are small and compact.</li>
+<li>Ground truth communities are not very isolated; they have a lot of connections pointing outside of the community.</li>
+<li>Most of the communities are small (10 or fewer nodes).</li>
+<li>In general, ground truth communities are small, with a low diameter, not isolated, and with different ranges of internal connectivity.</li>
+</ul>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index.png" alt=""></td>
+<td style="text-align:center"><img src="index2.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index3.png" alt=""></td>
+<td style="text-align:center"><img src="index4.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index5.png" alt=""></td>
+<td style="text-align:center"><img src="index6.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>The authors performed the same experiment for the DATAGEN and LFR graphs. They generated a graph of 150k nodes, using their default parameters. In the case of LFR, they tested five different values of the mixing factor, which specifies the ratio of edges of a community pointing outside of the community. They ranged this value from 0 to 0.5. The following are the distributions for DATAGEN.</p>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index8.png" alt=""></td>
+<td style="text-align:center"><img src="index9.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index10.png" alt=""></td>
+<td style="text-align:center"><img src="index11.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index11.png" alt=""></td>
+<td style="text-align:center"><img src="index12.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>The main conclusions that can be extracted from DATAGEN can be summarized as follows:</p>
+<ul>
+<li>DATAGEN is able to reproduce the multimodal distribution observed for clustering coefficient, TPR and bridge ratio.</li>
+<li>The central part of the clustering coefficient distribution is biased towards the left, in a similar way as observed for the Youtube and Livejournal graphs.</li>
+<li>Communities of DATAGEN graphs are, as in real graphs, not isolated, but in this case their level of isolation is significantly larger.</li>
+<li>The diameter is small, like in the real graphs.</li>
+<li>It is significant that communities in DATAGEN graphs are closer to those observed in Youtube and Livejournal, as these are social networks like the graphs produced by DATAGEN.
We see that DATAGEN is able to reproduce many of their characteristics.</li>
+</ul>
+<p>Finally, the authors repeat the same experiment for LFR graphs. The following are the plots for the LFR graph with mixing ratio 0.3. From them, the authors extract the following conclusions:</p>
+<ul>
+<li>LFR graphs do not show the multimodal distribution observed in real graphs.</li>
+<li>Only the diameter shows a shape similar to that in the ground truth.</li>
+</ul>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index13.png" alt=""></td>
+<td style="text-align:center"><img src="index14.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index15.png" alt=""></td>
+<td style="text-align:center"><img src="index16.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index17.png" alt=""></td>
+<td style="text-align:center"><img src="index18.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>To better quantify how similar the distributions of the different graphs are, the authors also show the correlograms for each of the statistical indicators. These correlograms contain Spearman&rsquo;s correlation coefficient between each pair of graphs for a given statistical indicator. The bluer the color, the stronger the correlation. We see that the DATAGEN distributions correlate very well with those observed in real graphs, especially, as we commented above, with Youtube and Livejournal. On the other hand, LFR only succeeds significantly in the case of the diameter.</p>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index19.png" alt=""></td>
+<td style="text-align:center"><img src="index20.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index21.png" alt=""></td>
+<td style="text-align:center"><img src="index22.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index23.png" alt=""></td>
+<td style="text-align:center"><img src="index24.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>We see that DATAGEN is able to reproduce a realistic community structure, compared to existing graph generators. This feature could potentially be exploited to define new benchmarks that measure the quality of novel community detection algorithms. Stay tuned for future blog posts about this topic!</p>
+<h4 id="references">References</h4>
+<p>[1] Arnau Prat-Pérez, <a href="http://dblp.uni-trier.de/pers/hd/d/Dom=iacute=nguez=Sal:David">David Domínguez-Sal</a>: How community-like is the structure of synthetically generated graphs?
<a href="http://dblp.uni-trier.de/db/conf/sigmod/grades2014.html#PratD14">GRADES 2014</a></p> +<p>[2] Deepayan Chakrabarti, Yiping Zhan, and ChristosFaloutsos. R-mat: A recursive model for graph mining. SIAM 2014</p> +<p>[3] Myunghwan Kim and Jure Leskovec. Multiplicative attribute graph model of real-world networks. Internet Mathematics</p> +<p>[4] Andrea Lancichinetti, Santo Fortunato, and Filippo Radicchi. Benchmark graphs for testing community detection algorithms. Physical Review E 2008.</p> + + + + + Industry Relevance of the Semantic Publishing Benchmark + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + Tue, 03 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + <h3 id="publishing-and-media-businesses-are-going-through-transformation">Publishing and media businesses are going through transformation</h3> +<p>I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and wrestling my jetlag in front of Hilton. In the lobby inside the SemTech 2010 conference attendants were watching a game from the FIFA World Cup in South Africa. In the picture, the self-service newspaper stand is empty, except for one free paper. It was not long ago, in the year 2000, this stand was full. Back than the people in the Bay area were willing to pay for printed newspapers. But this is no longer true.</p> +<p>What’s driving this change in publishing and media?</p> +<ul> +<li> +<p>Widespread and instantaneous distribution of information over the Internet has turned news into somewhat of a &ldquo;commodity&rdquo; and few people are willing to pay for it</p> +</li> +<li> +<p>The wealth of free content on YouTube and similar services spoiled the comfort of many mainstream broadcasters;</p> +</li> +<li> +<p>Open access publishing has limited academic publishers to sell journals and books at prices that were considered fair ten years ago.</p> +</li> +</ul> +<p><em>Alongside other changes in the industry, publishers figured out that it is critical to add value through better authoring, promotion, discoverability, delivery and presentation of precious content.</em></p> +<h3 id="imagine-instant-news-in-context-imagine-personal-channels-imagine--triplestores">Imagine instant news in context, Imagine personal channels, Imagine &hellip; triplestores</h3> +<p>While plain news can be created repeatedly, premium content and services are not as easy to create. Think of an article that not only tells the new facts, but refers back to previous events and is complemented by an info-box of relevant facts. It allows one to interpret and comprehend news more effectively. This is the well-known journalistic aim to put news in context. It is also well-known that producing such news in &ldquo;near real time&rdquo; is difficult and expensive using legacy processes and content management technology.</p> +<p>Another example would be a news feed that delivers good coverage of information relevant to a narrow subject – for example a company, a story line or a region. Judging by the demand for intelligent press clipping services like <a href="http://new.dowjones.com/products/factiva/">Factiva</a>, such channels are in demand but are not straightforward to produce with today’s technology. 
Despite the common perception that automated recommendations for related content and personalized news are technology no-brainers, suggesting truly relevant content is far from trivial.</p> +
<p>Finally, if we use an example in life sciences, the ability to quickly find scientific articles discussing asthma and x-rays, while searching for respiration disorders and radiation, requires a search service that is not easy to deliver.</p> +
<p>Many publishers have been pressed to advance their business. This, in turn, has led to a quest to innovate. And semantic technology can help publishers in two fundamental ways:</p> +
<ol> +
<li>Generation of rich and &ldquo;meaningful&rdquo; (trying not to use &ldquo;semantic&rdquo; :-) metadata descriptions;</li> +
<li>Dynamic retrieval of content, based on this rich metadata, enabling better delivery.</li> +
</ol> +
<p>In this post I write about &ldquo;semantic annotation&rdquo; and how it enables application scenarios like BBC’s Dynamic Semantic Publishing (DSP). I will also present the business case behind DSP. The final part of the post is about triplestores – semantic graph database engines, used in DSP. To be more concrete, I write about the Semantic Publishing Benchmark (SPB), which evaluates the performance of triplestores in DSP scenarios.</p> +
<h3 id="semantic-annotation-produces-rich-metadata-descriptions--the-fuel-for-semantic-publishing">Semantic Annotation produces Rich Metadata Descriptions – the fuel for semantic publishing</h3> +
<p>The most popular meaning of &ldquo;semantic annotation&rdquo; is the process of enriching text with links to (descriptions of) concepts and entities mentioned in the text. This usually means tagging either the entire document or specific parts of it with identifiers of entities. These identifiers allow one to retrieve descriptions of the entities and relations to other entities – additional structured information that fuels better search and presentation.</p> +
<p><img src="02_semantic_repository.png" alt=""></p> +
<p>The concept of using <a href="http://infosys3.elfak.ni.ac.rs/nastava/attach/SemantickiWebKurs/sdarticle.pdf">text-mining for automatic semantic annotation</a> of text with respect to very large datasets, such as <a href="http://dbpedia.org/">DBPedia</a>, emerged in the early 2000s. In practical terms it means using such large datasets as a sort of gigantic gazetteer (name lookup tool) and the ability to disambiguate. Figuring out whether &ldquo;Paris&rdquo; in the text refers to the capital of France, to Paris, Texas, or to Paris Hilton is crucial in such a context. Sometimes this is massively difficult – try to instruct a computer how to guess whether &ldquo;Hilton&rdquo; in the second sentence of this post refers to a hotel from the chain founded by her grandfather or to the fact that I had the chance to meet Paris Hilton in person on the street in San Francisco.</p> +
<p>Today there are plenty of tools (such as the <a href="https://www.ontotext.com/semantic-solutions/media-publishing/">Ontotext Media and Publishing</a> platform and <a href="https://github.com/dbpedia-spotlight/dbpedia-spotlight/wiki">DBPedia Spotlight</a>) and services (such as Thomson Reuters’ <a href="http://www.opencalais.com/">OpenCalais</a> and Ontotext’s <a href="http://s4.ontotext.com">S4</a>) that offer automatic semantic annotation. Although text-mining cannot deliver 100% correct annotations, there are plenty of scenarios where technology like this would revolutionize a business. 
This is the case with the Dynamic Semantic Publishing scenario described below.</p> +<h3 id="the-bbcs-dynamic-semantic-publishing-dsp">The BBC’s Dynamic Semantic Publishing (DSP)</h3> +<p>Dynamic Semantic Publishing is a model for using semantic technology in media developed by a group led by John O’Donovan and Jem Rayfield at the BBC. The implementation of DSP behind BBC’s FIFA World Cup 2010 website was the first high-profile success story for usage of semantic technology in media. It is also the basis for the SPB benchmark – sufficient reasons to introduce this use case at length below.</p> +<p>BBC Future Media &amp; Technology department have transformed the BBC relational content management model and static publishing framework to a fully dynamic semantic publishing architecture. With minimal journalistic management, media assets are being enriched with links to concepts, semantically described in a triplestore. This novel semantic approach provides improved navigation, content re-use and re-purposing through automatic aggregation and rendering of links to relevant stories. At the end of the day DSP improves the user experience on BBC’s web site.</p> +<p><em>&ldquo;A high-performance dynamic semantic publishing framework facilitates the publication of automated metadata-driven web pages that are light-touch, requiring minimal journalistic management, as they automatically aggregate and render links to relevant stories&rdquo;.</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">Jem Rayfield, Senior Technical Architect</a>, BBC News and Knowledge</p> +<p>The Dynamic Semantic Publishing (DSP) architecture of the BBC curates and publishes content (e.g. articles or images) based on embedded Linked Data identifiers, ontologies and associated inference. It allows for journalists to determine levels of automation (&ldquo;edited by exception&rdquo;) and support semantic advertisement placement for audiences outside of the UK. The following quote explains the workflow when a new article gets into BBC’s content management system.</p> +<p><em>&ldquo;In addition to the manual selective tagging process, journalist-authored content is automatically analysed against the World Cup ontology. A <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#language">natural language and ontological determiner process</a> automatically extracts World Cup concepts embedded within a textual representation of a story. The concepts are moderated and, again, selectively applied before publication. Moderated, automated concept analysis improves the depth, breadth and quality of metadata publishing.</em></p> +<p><img src="03_bbc_sport.png" alt=""></p> +<p><em>Journalist-published metadata is captured and made persistent for querying using the resource description framework (<a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#RDF"><em>RDF</em></a>) metadata representation and triple store technology. <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#BigOWLIM">A RDF triplestore</a> and <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#SPARQL">SPARQL</a> approach was chosen over and above traditional relational database technologies due to the requirements for interpretation of metadata with respect to an ontological domain model. 
The high level goal is that the domain ontology allows for intelligent mapping of journalist assets to concepts and queries. The chosen triplestore provides reasoning following the forward-chaining model and thus implied inferred statements are automatically derived from the explicitly applied journalist metadata concepts. For example, if a journalist selects and applies the single concept &ldquo;Frank Lampard&rdquo;, then the framework infers and applies concepts such as &ldquo;England Squad&rdquo;, &ldquo;Group C&rdquo; and &ldquo;FIFA World Cup 2010&rdquo; &hellip;&rdquo;</em> &ndash; Jem Rayfield</p> +<p>One can consider each of the &ldquo;aggregation pages&rdquo; of BBC as a sort of feed or channel serving content related to a specific topic. If you take this perspective, with its World Cup 2010 website BBC was able to provide more than 700 thematic channels.</p> +<p><em>&ldquo;The World Cup site is a large site with over 700 aggregation pages (called index pages) designed to lead you on to the thousands of story pages and content</em></p> +<p><strong>…</strong><strong><em>we are not publishing pages, but publishing content</em></strong> <em>as assets which are then organized by the metadata dynamically into pages, but could be re-organized into any format we want much more easily than we could before.</em></p> +<p><img src="04_content_tagging.png" alt=""></p> +<p><em>… The index pages are published automatically. This process is what assures us of the highest quality output, but still <strong>save large amounts of time</strong> in managing the site and <strong>makes it possible for us to efficiently run so many pages</strong> for the World Cup.&rdquo;</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/the_world_cup_and_a_call_to_ac.html">John O&rsquo;Donovan, Chief Technical Architect, BBC Future Media &amp; Technology</a></p> +<p>To get a real feeling about the load of the triplestore behind BBC&rsquo;s World Cup web site, here are some statistics:</p> +<ul> +<li> +<p>800+ aggregation pages (Player, Team, Group, etc.), generated through SPARQL queries;</p> +</li> +<li> +<p>Average unique page requests/day: 2 million;</p> +</li> +<li> +<p>Average <strong>SPARQL queries/day: 1 million;</strong></p> +</li> +<li> +<p><strong>100s repository updates/inserts per minute</strong> with OWL 2 RL reasoning;</p> +</li> +<li> +<p>Multi data center that is fully resilient, clustered 6 node triplestore.</p> +</li> +</ul> +<h3 id="the-semantic-publishing-benchmark">The Semantic Publishing Benchmark</h3> +<p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the BBC Dynamic Semantic Publishing scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volumes of read requests (SPARQL queries collecting recent content and data to generate web pages on a specific subject, e.g. Frank Lampard).</p> +<p>SPB simulates a setup for media that deals with large volumes of streaming content, e.g. articles, pictures, videos. This content is being enriched with metadata that describes it through links to reference knowledge:</p> +<ul> +<li> +<p><em>Reference knowledge:</em> taxonomies and databases that include relevant concepts, entities and factual information (e.g. 
sport statistics);</p> +</li> +<li> +<p><em>Metadata</em> for each individual piece of content allows publishers to efficiently produce live streams of content relevant to specific subjects.</p> +</li> +</ul> +<p>In this scenario the triplestore holds both reference knowledge and metadata. The main interactions with the repository are of two types:</p> +<ul> +<li> +<p><em>Aggregation queries</em> retrieve content according to various criteria. There are two sets (mixes) of aggregation queries. The basic one includes interactive queries that involve retrieval of concrete pieces of content, as well as aggregation functions, geo-spatial and full-text search constraints. The analytical query mix includes analytical queries, faceted search and drill-down queries;</p> +</li> +<li> +<p><em>Updates</em>, adding new metadata or updating the reference knowledge. It is important that such updates should immediately impact the results of the aggregation queries. Imagine a fan checking the page for Frank Lampard right after he scored a goal – she will be very disappointed to see out of date statistics there.</p> +</li> +</ul> +<p>SPB v.1.0 directly reproduces the DSP setup at the BBC. The reference dataset consists of BBC Ontologies (Core, Sport, News), BBC datasets (list of F1 teams, MPs, etc.) and an excerpt from <a href="http://www.geonames.org/">Geonames</a> for the UK. The benchmark is packed with metadata generator that allows one to set up experiments at different scales. The metadata generator produces 19 statements per Creative Work (BBC’s slang for all sorts of media assets). The standard scale factor is 50 million statements.</p> +<p>A more technical introduction to SPB can be found in this <a href="https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark">post</a>. Results from experiments with SPB on different hardware configurations, including AWS instances, are available in this <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">post</a>. An interesting discovery is that given the current state of the technology (particularly the GraphDB v.6.1 engine) and today’s cloud infrastructure, the load of BBC’s World Cup 2010 website can be handled at AWS by a cluster that costs only $81/day.</p> +<p>Despite the fact that SPB v.1.0 follows closely the usage scenario for triplestores in BBC’s DSP incarnations, it is relevant to a wide range of media and publishing scenarios, where large volumes of &ldquo;fast flowing&rdquo; content need to be &ldquo;dispatched&rdquo; to serve various information needs of a huge number of consumers. The main challenges can be summarized as follows:</p> +<ul> +<li> +<p>The Triplestore is used as operational database serving a massive number of read queries (hundreds of queries per second) in parallel with tens of update transactions per second. Transactions need to be handled instantly and in a reliable and consistent manner;</p> +</li> +<li> +<p>Reasoning is needed to map content descriptions to queries in a flexible manner;</p> +</li> +<li> +<p>There are specific requirements, such as efficient handling of full-text search, geo-spatial and temporal constraints.</p> +</li> +</ul> +<h3 id="spb-v20--steeper-for-the-engines-closer-to-the-publishers">SPB v.2.0 – steeper for the engines, closer to the publishers</h3> +<p>We are in the final testing of the new version 2.0 of SPB. 
The benchmark has evolved to allow for retrieval of semantically relevant content in a more advanced manner and at the same time to demonstrate how triplestores can offer simplified and more efficient querying.</p> +<p>The major changes in SPB v.2.0 can be summarized as follows:</p> +<ul> +<li> +<p>Much bigger reference dataset: from 170 thousand to 22 million statements. Now it includes GeoNames data about all of Europe (around 7 million statements) and DBPedia data about companies, people and events (14 million statements). This way we can simulate media archives described against datasets with good global coverage for specific types of objects. Such large reference sets also provide a better testing ground for experiments with very large content archives – think of 50 million documents (1 billion statements) or more;</p> +</li> +<li> +<p>Better interconnected reference data: more than 5 million links between entities, including 500,000 owl:sameAs links between DBPedia and Geonames descriptions. The latter evaluates the capabilities of the engine to deal with data coming from multiple sources, which use different identifiers for one and the same entity;</p> +</li> +<li> +<p>Retrieval of relevant content through links in the reference data, including inferred ones. To this end it is important than SPB v.2.0 involves much more comprehensive inference, particularly with respect to transitive closure of parent-company and geographic nesting chains.</p> +</li> +</ul> + + + + + OWL-Empowered SPARQL Query Optimization + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + Wed, 18 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + <p>The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution plans for a given query.</p> +<p>In this post, we propose a different approach to query optimization, which is meant to complement (rather than replace) the standard optimization methodologies for SPARQL queries. Our approach is based on the use of schema information, encoded using OWL constructs, which often accompany Linked Data.</p> +<p>OWL adopts the Open World Assumption and hence OWL axioms are perceived primarily to infer new knowledge. Nevertheless, ontology designers consider OWL as an expressive schema language used to express constraints for validating the datasets, hence following the Closed World Assumption when interpreting OWL ontologies. Such constraints include disjointness/equivalence of classes/properties, cardinality constraints, domain and range restrictions for properties and others.</p> +<p>This richness of information carried over by OWL axioms can be the basis for the development of schema-aware techniques that will allow significant improvements in the performance of existing RDF query engines when used in tandem with data statistics or even other heuristics based on patterns found in SPARQL queries. 
As a simple example, a cardinality constraint at the schema level can provide a hint on the proper join ordering, even if data statistics are missing or incomplete.</p> +<p>The aim of this post is to show that the richness of information carried over by OWL axioms under the Close World Assumption can be the basis for the development of schema-aware optimization techniques that will allow considerable improvement for query processing. To attain this objective, we discuss a small set of interesting cases of OWL axioms; a full list can be found <a href="LDBC_D4.4.2_final.pdf">here</a>.</p> +<h3 id="schema-based-optimization-techniques">Schema-Based Optimization Techniques</h3> +<p>Here we provide some examples of queries, which, when combined with specific schema constraints expressed in OWL, can help the optimizer in formulating the (near to) optimal query plans.</p> +<p>A simple first case is the case of constraint violation. Consider the query below, which returns all instances of class <code>&lt;A&gt;</code> which are fillers of a specific property <code>&lt;P&gt;</code>. If the underlying schema contains the information that the range of <code>&lt;P&gt;</code> is class <code>&lt;B&gt;</code>, and that class <code>&lt;B&gt;</code> is disjoint from class <code>&lt;A&gt;</code>, then this query should return the empty result, with no further evaluation (assuming that the constraints associated with the schema are satisfied by the data). An optimizer that takes into account schema information should return an empty result in constant time instead of trying to optimize or evaluate the large star join.</p> +<pre tabindex="0"><code>SELECT ?v +WHERE { ?v rdf : type &lt;A&gt; . + ?u &lt;P&gt; ?v . ?u &lt;P&gt; ?v1 . + ?u &lt;P1 &gt; ?v2 . ?u &lt;P2 &gt; ?v3 . + ?u &lt;P3 &gt; ?v4 . ?u &lt;P4 &gt; ?v5} +</code></pre><p>Schema-aware optimizers could also prune the search space by eliminating results that are known a priori not to be in the answer set of a query. The query above is an extreme such example (where all potential results are pruned), but other cases are possible, such as the case of the query below, where all subclasses of class <code>&lt;A1&gt;</code> can immediately be identified as not being in the answer set.</p> +<pre tabindex="0"><code>SELECT ?c +WHERE { ?x rdf: type ?c . ?x &lt;P&gt; ?y . + FILTER NOT EXISTS \{ ?x rdf: type &lt;A1 &gt; }} +</code></pre><p>Another category of schema-empowered optimizations has to do with improved selectivity estimation. In this respect, knowledge about the cardinality (minimum cardinality, maximum cardinality, exact cardinality, functionality) of a property can be exploited to formulate better query plans, even if data statistics are incomplete, missing or erroneous.</p> +<p>Similarly, taking into account class hierarchies, or the definition of classes/properties via set theoretic constructs (union, intersection) at the schema level, can provide valuable information on the selectivity of certain triple patterns, thus facilitating the process of query optimization. Similar effects can be achieved using information about properties (functionality, transitivity, symmetry etc).</p> +<p>As an example of these patterns, consider the query below, where class <code>&lt;C&gt;</code> is defined as the intersection of classes <code>&lt;C1&gt;</code>,<code> &lt;C2&gt;</code>. 
Thus, the triple pattern <code>(?x rdf:type &lt;C&gt;)</code> is more selective than <code>(?y rdf:type &lt;C1&gt;)</code> and <code>(?z rdf:type &lt;C2&gt;)</code>, and this should be immediately recognizable by the optimizer, without having to resort to cost estimations. This example also shows how unnecessary triple patterns can be pruned from a query to reduce the number of necessary joins. Figure 1 illustrates the query plan obtained when the OWL intersectionOf construct is used.</p> +
<pre tabindex="0"><code>SELECT ?x
WHERE { ?x rdf:type &lt;C&gt; . ?x &lt;P1&gt; ?y .
        ?y rdf:type &lt;C1&gt; . ?y &lt;P2&gt; ?z . ?z rdf:type &lt;C2&gt; }
</code></pre><p><img src="owl_constraints.png" alt="image"></p> +
<p>Schema information can also be used by the query optimizer to rewrite SPARQL queries into equivalent ones that are in a form to which already-known optimization techniques are easily applicable. For example, the query below could easily be transformed into a classical star-join query if we know (from the schema) that property <code>P4</code> is a symmetric property.</p> +
<pre tabindex="0"><code>SELECT ?y ?y1 ?y2 ?y3
WHERE { ?x &lt;P1&gt; ?y . ?x &lt;P2&gt; ?y1 .
        ?x &lt;P3&gt; ?y2 . ?y3 &lt;P4&gt; ?x }
</code></pre><h3 id="conclusion">Conclusion</h3> +
<p>In this post we argued that OWL-empowered optimization techniques can be beneficial for SPARQL query optimization when used in tandem with standard heuristics based on statistics. We provided some examples which showed the power of such optimizations in various cases, namely:</p> +
<ul> +
<li>Cases where the search space can be pruned due to the schema and the associated constraints; an extreme special sub-case is the identification of queries that violate schema constraints and thus produce no results.</li> +
<li>Cases where the schema can help in the estimation of triple pattern selectivity, even if statistics are incomplete or missing.</li> +
<li>Cases where the schema can identify redundant triple patterns that do not affect the result and can be safely eliminated from the query.</li> +
<li>Cases where the schema can be used for rewriting a query in an equivalent form that would facilitate optimization using well-known optimization techniques.</li> +
</ul> +
<p>This list is by no means complete, as further cases can be identified by optimizers. Our aim in this post was not to provide a complete listing, but to demonstrate the potential of the idea in various directions.</p> +
 
 
 
 
 Person Activity Subgraph Features in LDBC DATAGEN
 https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/
 Wed, 04 Feb 2015 00:00:00 +0000
 
 https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/
 <p>When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically drawn to the friendship subgraph and/or its structure. However, a social graph is more than a bunch of people connected by friendship relations; it contains many other elements that are worth looking at. With a quick look at commercial social networks like Facebook, Twitter or Google+, one can easily identify a lot of other elements such as text, images or even video assets. More importantly, all these elements form other subgraphs within the social network! 
For example, the person activity subgraph is composed of posts and their replies in the different forums/groups of a social network, and has a tree-like structure connecting people through their message interactions.</p> +
<p>When looking at the LDBC Social Network Benchmark (SNB) and its interactive workload, one realizes that these other subgraphs, and especially the person activity subgraph, play a role even more important than that played by the friendship subgraph. Just two numbers that illustrate this importance: 11 out of the 14 interactive workload queries need to traverse parts of the person activity subgraph, and about 80% of all the data generated by DATAGEN belongs to this subgraph. As a consequence, a lot of effort has been devoted to making sure that the person activity subgraph is realistic enough to fulfill the needs of the benchmark. In the rest of this post, I will discuss some of the features implemented in DATAGEN that make the person activity subgraph interesting.</p> +
<h3 id="reaslistic-message-content">Realistic Message Content</h3> +
<p>Messages&rsquo; content in DATAGEN is not random, but contains snippets of text extracted from DBpedia talking about the tags the message has. Furthermore, not all messages are the same size, depending on whether they are posts or replies to them. For example, the size of a post is selected uniformly between a minimum and a maximum, but there is also a small probability that the content is very large (about 2000 characters). In the case of comments (replies to posts), there is a probability of 0.66 that they are very short (“ok”, “good”, “cool”, “thanks”, etc.). Moreover, in real forum conversations, it is typical to see conversations evolving from one topic to another. For this reason, there is a probability that the tags of comments replying to a post change during the flow of the conversation, moving from the post&rsquo;s tags to other related or randomly selected tags.</p> +
<h3 id="non-uniform-activity-levels">Non-uniform activity levels</h3> +
<p>In a real social network, not all the members show the same level of activity. Some people post messages more sporadically than others, whose activity is significantly higher. DATAGEN reproduces this phenomenon by correlating the activity level with the number of friends a person has. That is, the larger the number of friends a person has, the larger the number of posts they create, and also, the larger the number of groups they belong to.</p> +
<h3 id="time-correlated-post-and-comment-generation">Time correlated post and comment generation</h3> +
<p>In a real social network, user activity is driven by real world events such as sport events, elections or natural disasters, to cite just a few. For this reason, we observe spikes of activity around these events, where the amount of messages created increases significantly during a short period of time, reaching a maximum and then decreasing. DATAGEN emulates this behavior by generating a set of real world events about specific tags. Then, when the dates of posts and comments are generated, these events are taken into account in such a way that posts and comments are clustered around them. Also, not all events are equally relevant, so some spikes are larger than others. The shape of the activity is modeled following the model described in <a href="#references">[1]</a>. Furthermore, in order to represent the more normal and uniform person activity levels, we also generate uniformly distributed messages along the time line. 
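</p>
<p>To make the message-content rules described earlier more concrete, here is a minimal, purely illustrative sketch of that kind of sampling logic. The 0.66 short-reply probability and the short-reply strings are the ones quoted in this post; the class, method names and size bounds are hypothetical and do not correspond to the actual DATAGEN code:</p>
<pre tabindex="0"><code>import java.util.Random;

// Illustrative sketch only: 0.66 is the short-reply probability quoted in this post;
// names and size bounds are hypothetical stand-ins, not DATAGEN internals.
class CommentContentSampler {
    private static final String[] SHORT_REPLIES = { "ok", "good", "cool", "thanks" };
    private final Random random = new Random();

    String sampleCommentContent(String tagSnippet) {
        // With probability 0.66 a reply is a very short message.
        if (random.nextDouble() &lt; 0.66) {
            return SHORT_REPLIES[random.nextInt(SHORT_REPLIES.length)];
        }
        // Otherwise the reply reuses a snippet of text about the tags being discussed,
        // cut to a length chosen uniformly between a minimum and a maximum.
        int min = 50, max = 500; // illustrative bounds, not the generator's real ones
        int length = min + random.nextInt(max - min + 1);
        return tagSnippet.substring(0, Math.min(length, tagSnippet.length()));
    }
}
</code></pre>
<p>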
The following figure shows the user activity volume along the time line.</p> +<p><img src="1.png" alt="image"></p> +<p>As we see, the timeline contains spikes of activity, instead of being uniform. Note that the generally increasing volume activity is due to the fact that more people is added to the social network as time advances.</p> +<p>In this post we have reviewed several interesting characteristics of the person activity generation process in DATAGEN. Stay tuned for future blog posts about this topic.</p> +<h4 id="references">References</h4> +<p>[1] Leskovec, J., Backstrom, L., &amp; Kleinberg, J. (2009, June). Meme-tracking and the dynamics of the news cycle. In <em>Proceedings of the 15th ACM SIGKDD international conference on Knowledge discovery and data mining</em> (pp. 497-506). ACM.</p> + + + + + SNB Driver - Part 2: Tracking Dependencies Between Queries + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + Fri, 23 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + <p>The <a href="https://ldbcouncil.org/post/snb-driver-part-1">SNB Driver part 1</a> post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we&rsquo;ll drill down deeper into the details of what it means to execute &ldquo;dependent queries&rdquo; during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in detail, it is just there to serve as a point of reference.</p> +<h3 id="definitions">Definitions</h3> +<ul> +<li> +<p><em>Simulation Time (ST)</em>: notion of time created by data generator. All time stamps in the generated data set are in simulation time</p> +</li> +<li> +<p><em>Real Time (RT)</em>: wall clock time</p> +</li> +<li> +<p><em>Time Compression Ratio</em>: function that maps simulation time to real time, e.g., an offset in combination with a compression ratio. It is a static value, set in driver configuration. Real Time Ratio is reported along with benchmark results, allowing others to recreate the same benchmark</p> +</li> +<li> +<p><em>Operation</em>: read and/or write</p> +</li> +<li> +<p><em>Dependencies</em>: operations in this set introduce dependencies in the workload. That is, for every operation in this set there exists at least one other operation (in Dependents) that can not be executed until this operation has been processed</p> +</li> +<li> +<p><em>Dependents</em>: operations in this set are dependent on at least one other operation (in Dependencies) in the workload</p> +</li> +<li> +<p><em>Due Time (DueT)</em>: point in simulation time at which the execution of an operation should be initiated.</p> +</li> +<li> +<p><em>Dependent Time (DepT)</em>: in addition to Due Time, every operation in Dependents also has a Dependent Time, which corresponds to the Due Time of the operation that it depends on. Dependent Time is always before Due Time. 
For operations with multiple dependencies Dependent Time is the maximum Due Time of all the operations it depends on.</p> +</li> +<li> +<p><em>Safe Time (SafeT)</em>: time duration.</p> +<ul> +<li> +<p>when two operations have a necessary order in time (i.e., dependency) there is at least a SafeT interval between them</p> +</li> +<li> +<p>SafeT is the minimum duration between the Dependency Time and Due Time of any operations in Dependents</p> +</li> +</ul> +</li> +<li> +<p>​<em>Operation Stream</em>: sequence of operations ordered by Due Time (dependent operations must separated by at least SafeT)</p> +</li> +<li> +<p><em>Initiated Operations</em>: operations that have started executing but not yet finished</p> +</li> +<li> +<p><em>Local Completion Time (per driver)</em>: point in simulation time behind which there are no uncompleted operationsLocal Completion Time = min(min(Initiated Operations), max(Completed Operations))</p> +</li> +<li> +<p><em>Global Completion Time (GCT)</em>: minimum completion time of all drivers. Once GCT has advanced to the Dependent Time of some operation that operation is safe to execute, i.e., the operations it depends on have all completed executing. Global Completion Time = min(Local Completion Time)​</p> +</li> +<li> +<p><em>Execution Window (Window)</em>: a timespan within which all operations can be safely executed</p> +<ul> +<li> +<p>All operations satisfying window.startTime &lt;= operation.DueT &lt; window.endTime may be executed</p> +</li> +<li> +<p>Within a window no restrictions on operation ordering or operation execution time are enforced, driver has a freedom of choosing an arbitrary scheduling strategy inside the window</p> +</li> +<li> +<p>To ensure that execution order respects dependencies between operations, window size is bounded by SafeT, such that: 0 &lt; window.duration &lt;= SafeT</p> +</li> +<li> +<p>Window duration is fixed, per operation stream; this is to simplify scheduling and make benchmark runs repeatable</p> +</li> +<li> +<p>Before any operations within a window can start executing it is required that: GCT &gt;= window.startTime - (SafeT - window.duration)</p> +</li> +<li> +<p>All operations within a window must initiate and complete between window start and end times: window.startTime &lt;= operation.initiate &lt; window.endTime and window.startTime &lt;= operation.complete &lt; window.endTime</p> +</li> +</ul> +</li> +<li> +<p><em>Dependency Mode</em>: defines dependencies, constraints on operation execution order</p> +</li> +<li> +<p><em>Execution Mode</em>: defines how the runtime should execute operations of a given type</p> +</li> +</ul> +<h3 id="tracking-dependencies">Tracking Dependencies</h3> +<p>Now, the fun part, making sure dependent operations are executed in the correct order.</p> +<p>Consider that every operation in a workload belongs to none, one, or both of the following sets: Dependencies and Dependents. As mentioned, the driver uses operation time stamps (Due Times) to ensure that dependencies are maintained. It keeps track of the latest point in time behind which every operation has completed. That is, every operation (i.e., dependency) with a Due Time lower or equal to this time is guaranteed to have completed execution. 
It does this by maintaining a monotonically increasing variable called Global Completion Time (GCT).</p> +<p>Logically, every time the driver (via a database connector) begins execution of an operation from Dependencies that operation is added to Initiated Operations:</p> +<ul> +<li>the set of operations that have started executing but not yet finished.</li> +</ul> +<p>Then, upon completion, the operation is removed from Initiated Operations and added to Completed Operations:</p> +<ul> +<li>the set of operations that have started and finished executing.</li> +</ul> +<p>Using these sets, each driver process maintains its own view of GCT in the following way. Local progress is monitored and managed using a variable called Local Completion Time (LCT):</p> +<ul> +<li>the point in time behind which there are no uncompleted operations. No operation in Initiated Operations has a lower or equal Due Time and no operation in Completed Operations has an equal or higher Due Time.</li> +</ul> +<p>LCT is periodically sent to all other driver processes, which all then (locally) set their view of GCT to the minimum LCT of all driver processes. At this point the driver has two, of the necessary three (third covered shortly), pieces of information required for knowing when to execute an operation:</p> +<ul> +<li> +<p><em>Due Time</em>: point in time at which an operation should be executed, assuming all preconditions (e.g., dependencies) have been fulfilled</p> +</li> +<li> +<p><em>GCT</em>: every operation (from Dependencies) with a Due Time before this point in time has completed execution</p> +</li> +</ul> +<p>However, with only GCT to track dependencies the driver has no way of knowing when it is safe to execute any particular dependent operation. What GCT communicates is that all dependencies up to some point in time have completed, but whether or not the dependencies for any particular operation are within these completed operations is unknown. The driver would have to wait until GCT has passed the Due Time (because Dependency Time is always lower) of an operation before that operation could be safely executed, which would result in the undesirable outcome of every operation missing its Due Time. The required information is which particular operation in Dependencies does any operation in Dependents depend on. More specifically, the Due Time of this operation. This is referred to as Dependent Time:</p> +<ul> +<li>in addition to Due Time, every operation in Dependents also has (read: must have) a Dependent Time, which corresponds to the latest Due Time of all the operations it depends on. Once GCT has advanced beyond the Dependent Time of an operation that operation is safe to execute.</li> +</ul> +<p>Using these three mechanisms (Due Time, GCT, and Dependent Time) the driver is able to execute operations, while ensuring their dependencies are satisfied beforehand.</p> +<h3 id="scalable-execution-in-the-presence-of-dependencies">Scalable execution in the Presence of Dependencies</h3> +<p>The mechanisms introduced in part 1 guarantee that dependency constraints are not violated, but in doing so they unavoidably introduce overhead of communication/synchronization between driver threads/processes. To minimize the negative effects that synchronization has on scalability an additional Execution Mode was introduced (more about Execution Modes will be discussed shortly): Windowed Execution. 
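</p>
<p>Before turning to Windowed Execution, the completion-time bookkeeping described above can be summarized with a purely illustrative sketch; the formulas in the comments are the ones given in the definitions, while the class and method names are hypothetical and not those of the actual driver code:</p>
<pre tabindex="0"><code>import java.util.concurrent.ConcurrentSkipListSet;

// Hypothetical sketch of the LCT/GCT bookkeeping; all times are simulation-time Due Times.
class CompletionTimeTracker {
    // Due Times of operations that have started but not yet finished (Initiated Operations)
    private final ConcurrentSkipListSet&lt;Long&gt; initiated = new ConcurrentSkipListSet&lt;&gt;();
    // Due Times of operations that have finished (Completed Operations)
    private final ConcurrentSkipListSet&lt;Long&gt; completed = new ConcurrentSkipListSet&lt;&gt;();

    void operationInitiated(long dueTime) { initiated.add(dueTime); }

    void operationCompleted(long dueTime) {
        initiated.remove(dueTime);
        completed.add(dueTime);
    }

    // Local Completion Time = min(min(Initiated Operations), max(Completed Operations))
    long localCompletionTime() {
        long minInitiated = initiated.isEmpty() ? Long.MAX_VALUE : initiated.first();
        long maxCompleted = completed.isEmpty() ? Long.MIN_VALUE : completed.last();
        return Math.min(minInitiated, maxCompleted);
    }

    // Global Completion Time = min(Local Completion Time) over all driver processes
    static long globalCompletionTime(long[] localCompletionTimes) {
        long gct = Long.MAX_VALUE;
        for (long lct : localCompletionTimes) {
            gct = Math.min(gct, lct);
        }
        return gct;
    }

    // A dependent operation is safe to execute once GCT has reached its Dependent Time.
    static boolean safeToExecute(long gct, long dependentTime) {
        return gct &gt;= dependentTime;
    }

    // A window may start executing once GCT &gt;= window.endTime - SafeT.
    static boolean windowMayStart(long gct, long windowEndTime, long safeT) {
        return gct &gt;= windowEndTime - safeT;
    }
}
</code></pre>
<p>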
Windowed Execution has two design goals:</p> +<p>a) make the generated load less &lsquo;bursty&rsquo;</p> +<p>b) allow the driver to &lsquo;scale&rsquo;, so when the driver is given more resources (CPUs, servers, etc.) it is able to generate more load.</p> +<p>In the context of Windowed Execution, operations are executed in groups (Windows), where operations are grouped according to their Due Time. Every Window has a Start Time, a Duration, and an End Time, and Windows contain only those operations that have a Due Time between Window.startTime and Window.endTime. Logically, all operations within a Window are executed at the same time, some time within the Window. No guaranty is made regarding exactly when, or in what order, an operation will execute within its Window.</p> +<p>The reasons this approach is correct are as follows:</p> +<ul> +<li> +<p>Operations belonging to the Dependencies set are never executed in this manner - the Due Times of Dependencies operations are never modified as this would affect how dependencies are tracked</p> +</li> +<li> +<p>The minimum duration between the Dependency Time and Due Time of any operation in Dependents is known (can be calculated by scanning through workload once), this duration is referred to as Safe Time (SafeT)</p> +</li> +<li> +<p>A window does not start executing until the dependencies of all its operations have been fulfilled. This is ensured by enforcing that window execution does not start until</p> +<p>GCT &gt;= window.startTime - (SafeT - window.duration) = window.endTime - SafeT; that is, the duration between GCT and the end of the window is no longer than SafeT</p> +</li> +</ul> +<p>The advantages of such an execution mode are as follows:</p> +<ul> +<li> +<p>As no guarantees are made regarding time or order of operation execution within a Window, GCT no longer needs to be read before the execution of every operation, only before the execution of every window</p> +</li> +<li> +<p>Then, as GCT is read less frequently, it follows that it does not need to be communicated between driver processes as frequently. There is no need or benefit to communicating GCT protocol message more frequently than approximately Window.duration, the side effect of which is reduced network traffic</p> +</li> +<li> +<p>Further, by making no guarantees regarding the order of execution the driver is free to reschedule operations (within Window bounds). The advantage being that operations can be rearranged in such a way as to reduce unwanted bursts of load during execution, which could otherwise occur while synchronizing GCT during demanding workloads. For example, a uniform scheduler may modify operation Due Times to be uniformly distributed across the Window timespan, to &lsquo;smoothen&rsquo; the load within a Window.</p> +</li> +</ul> +<p>As with any system, there are trade-offs to this design, particularly regarding Window.duration. The main trade-off is that between &lsquo;workload resolution&rsquo; and scalability. Increasing Window.duration reduces synchronization but also reduces the resolution at which the workload definition is followed. That is, the generated workload becomes less like the workload definition. However, as this is both bounded and configurable, it is not a major concern. This issue is illustrated in Figure 1, where the same stream of events is split into two different workloads based on different size of the Window. 
The workload with Window size 5 (on the right) has better resolution, especially for the &lsquo;bursty&rsquo; part of the event stream.</p> +<p><img src="window-scheduling.png" alt="image"><br> +Figure 1. Window scheduling</p> +<p>This design also trades a small amount of repeatability for scalability: as there are no timing or ordering guarantees within a window, two executions of the same window are not guaranteed to be equivalent - &lsquo;what happens in the window stays in the window&rsquo;. Despite sacrificing this repeatability, the results of operations do not change. No dependency-altering operations occur during the execution of a Window, therefore results for all queries should be equivalent between two executions of the same workload, there is no effect on the expected result for any given operation.</p> + + + + + SNB Driver - Part 3: Workload Execution Putting It All Together + https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/ + Tue, 20 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/ + <p>Up until now we have introduced the <a href="https://ldbcouncil.org/post/snb-driver-part-1">challenges faced when executing the LDBC SNB benchmark</a>, as well as explained <a href="https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries">how some of these are overcome</a>. With the foundations laid, we can now explain precisely how operations are executed.</p> +<p>Based on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these classifications the driver runtime then knows how each operation should be executed. These modes, as well as what they mean to the driver runtime, are described below.</p> +<h3 id="dependency-modes">Dependency Modes</h3> +<p>While executing a workload the driver treats operations differently, depending on their Dependency Mode. In the previous section operations were categorized by whether or not they are in the sets Dependencies and/or Dependents.</p> +<p>Another way of communicating the same categorization is by assigning a Dependency Mode to operations - every operation type generated by a workload definition must be assigned to exactly one Dependency Mode. Dependency modes define dependencies, constraints on operation execution order. The driver supports a number of different Dependency Modes: None, Read Only, Write Only, Read Write. 
During workload execution, operations of each type are treated as follows:</p> +
<p><strong>• None</strong></p> +
<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations to have completed executing)</p> +
<p>– Prior Execution: do nothing – After Execution: do nothing</p> +
<p><strong>• Read Only</strong></p> +
<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations to have completed executing)</p> +
<p>Dependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p> +
<p>– Prior Execution: wait for GCT &gt;= operation.DepT – After Execution: do nothing</p> +
<p><strong>• Write Only</strong></p> +
<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p> +
<p>Dependent On (NO): operation execution does not depend on GCT to have advanced sufficiently (i.e., correct execution of these operations does not depend on any other operations to have completed execution)</p> +
<p>– Prior Execution: add operation to Initiated Operations</p> +
<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p> +
<p><strong>• Read Write</strong></p> +
<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p> +
<p>Dependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p> +
<p>– Prior Execution: add operation to Initiated Operations, wait for GCT &gt;= operation.DepT</p> +
<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p> +
<h3 id="execution-modes">Execution Modes</h3> +
<p>Execution Modes relate to how operations are scheduled, when they are executed, and what their failure conditions are. Each operation type in a workload definition must be assigned to exactly one Execution Mode. The driver supports a number of different Execution Modes: Asynchronous, Synchronous, Partially Synchronous. It splits a single workload operation stream into multiple streams, zero or more streams per Execution Mode. 
During workload execution, operations from each of these streams are treated as follows.</p> +<p><strong>• Asynchronous</strong>: operations are executed individually, when their Due Time arrives.</p> +<p>Motivation: This is the default execution mode, it executes operations as true to the workload definition as possible.</p> +<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler – Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: unbounded</p> +<p>– Max Execution Time: unbounded</p> +<p>– Failure: operation execution starts later than: operation.DueT Tolerated Delay</p> +<p><strong>• Synchronous</strong>: operations are executed individually, sequentially, in blocking manner.</p> +<p>Motivation: Some dependencies are difficult to capture efficiently with SafeT and GCT alone. For example, social applications often support conversations via posts and likes, where likes depend on the existence of posts. Furthermore, posts and likes also depend on the existence of the users that make them. However, users are created at a lower frequency than posts and likes, and it can be assumed they do not immediately start creating content. As such, a reasonably long SafeT can be used between the creation of a user and the first time that user creates posts or likes. Conversely, posts are often replied to and/or liked soon after their creation, meaning a short SafeT would be necessary to maintain the ordering dependency. Consequently, maintaining the dependencies related to conversations would require a short SafeT, and hence a small window. This results in windows containing fewer operations, leading to less potential for parallelism within windows, less freedom in scheduling, more synchronization, and greater likelihood of bursty behavior - all negative things.</p> +<p>The alternative offered by Synchronous Execution is that, when practical, operations of certain types can be partitioned (e.g. posts and likes could be partitioned by the forum in which they appear), and partitions assigned to driver processes. Using the social application example from above, if all posts and likes were partitioned by forum the driver process that executes the operations from any partition could simply execute them sequentially. 
Then the only dependency to maintain would be on user operations, reducing synchronization dramatically, and parallelism could still be achieved as each partition would be executed independently, in parallel, by a different driver process.</p> +<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler</p> +<p>– Execute When time &gt;= operation.DueT and previousOperation.completed == true (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: 1</p> +<p>– Max Execution Time: nextOperation.DueT - operation.DueT</p> +<p>– Failure: operation execution starts later than: operation.DueT Tolerated Delay E.g., if previousOperation did not complete in time, forcing current operation to wait for longer than the tolerated-delay</p> +<p><strong>• Partially Synchronous</strong> (Windowed Execution, described in Section 3.4 in more details), groups of operations from the same time window are executed together</p> +<p>– Re-scheduling Before Execution: Yes, as long as the following still holds:</p> +<p>window.startTime &lt;= operation.DueT &lt; window.startTime + window.duration</p> +<p>Operations within a window may be scheduled in any way, as long as they remain in the window from which they originated: their Due Times, and therefore ordering, may be modified</p> +<p>– Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: number of operations within window</p> +<p>– Max Execution Time: (window.startTime + window.duration) - operation.DueT</p> +<p>– Failure: operation execution starts later than: window.startTime window.duration operation execution does not finish by: window.startTime + window.duration</p> +<h3 id="tying-it-back-to-ldbc-snb">Tying it back to LDBC SNB</h3> +<p>The driver was designed to execute the workload of LDBC SNB. As discussed, the main challenge of running queries in parallel on graph-shaped data stem from dependencies introduced by the graph structure. In other words, workload partitioning becomes as hard as graph partitioning.</p> +<p>The LDBC SNB data can in fact be seen as a union of two parts:</p> +<ol> +<li> +<p>Core Data: relatively small and dense friendship graph (not more than 10% of the data). Updates on this part are very hard to partition among driver threads, since the graph is essentially a single dense strongly connected component.</p> +</li> +<li> +<p>User Activity Data: posts, replies, likes; this is by far the biggest part of the data. Updates on this part are easily partitioned as long as the dependencies with the &ldquo;core&rdquo; part are satisfied (i.e., users don&rsquo;t post things before the profiles are created, etc.).</p> +</li> +</ol> +<p>In order to avoid friendship graph partitioning, the driver introduces the concept SafeT, the minimal simulation time that should pass between two dependent events.</p> +<p>This property is enforced by the data generator, i.e. the driver does not need to change or delay some operations in order to guarantee dependency safety. Respecting dependencies now means globally communicating the advances of the Global Completion Time, and making sure the operations do not start earlier than SafeT from their dependents.</p> +<p>On the other hand, the driver exploits the fact that some of the dependencies in fact do not hinder partitioning: although replies to the post can only be sent after the post is created, these kinds of dependencies are satisfied if we partition workload by forums. 
This way, all (update) operations on posts and comments from one forum are assigned to one driver thread. Since there is typically a lot of forums, each driver thread gets multiple ones. Updates from one forum are then run in Synchronous Execution Mode, and parallelism is achieved by running many distinct forums in parallel. By doing so, we can add posts and replies to forums at very high frequency without the need to communicate the GCT across driver instances (i.e. we efficiently create the so-called flash-mob effects in the posting/replying workload).</p> + + + + + Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide + https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/ + Tue, 13 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/ + <p>Until now we have discussed several aspects of the <a href="https://ldbcouncil.org/benchmarks/spb">Semantic Publishing Benchmark (SPB)</a> such as the <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">difference in performance between virtual and real servers configuration</a>, how to choose an <a href="https://ldbcouncil.org/post/making-semantic-publishing-execution-rules">appropriate query mix</a> for a benchmark run and our experience with using SPB in the development process of GraphDB for <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">finding performance issues</a>.</p> +<p>In this post we provide a step-by-step guide on how to run SPB using the <a href="http://rdf4j.org/">Sesame</a> RDF data store on a fresh install of <a href="http://releases.ubuntu.com/14.04.1/">Ubuntu Server 14.04.1</a>. The scenario is easy to adapt to other RDF triple stores which support the Sesame Framework used for querying and analyzing RDF data.</p> +<h3 id="prerequisites">Prerequisites</h3> +<p>We start with a fresh server installation, but before proceeding with setup of the Sesame Data Store and SPB benchmark we need the following pieces of software up and running:</p> +<ul> +<li>Git</li> +<li>Apache Ant 1.8 or higher</li> +<li>OpenJDK 6 or Oracle JDK 6 or higher</li> +<li>Apache Tomcat 7 or higher</li> +</ul> +<p>If you already have these components installed on your machine you can directly proceed to the next section: <em>Installing Sesame</em></p> +<p>Following are sample commands which can be used to install the required software components:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo apt-get install git +</span></span><span style="display:flex;"><span>sudo apt-get install ant +</span></span><span style="display:flex;"><span>sudo apt-get install default-jdk +</span></span><span style="display:flex;"><span>sudo apt-get install tomcat7 +</span></span></code></pre></div><p>Optionally Apache Tomcat Server can be downloaded as a zipped file and extracted in a location of choice.</p> +<p>After a successful installation of Apache Tomcat you should be able to get the default splash page <em>“It works”</em> when you open your web browser and enter the following address: http://&lt;your_ip_address&gt;:8080</p> +<h3 id="installing-sesame">Installing Sesame</h3> +<p>We will use current Sesame version 2.7.14. 
You can download it <a href="http://sourceforge.net/projects/sesame/files/Sesame%202/">here</a> or run following command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>wget <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;http://sourceforge.net/projects/sesame/files/Sesame%202/2.7.14/openrdf-sesame-2.7.14-sdk.tar.gz/download&#34;</span> <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> -O openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>Then extract the Sesame tarball:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>tar -xvzf openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>To deploy sesame you have to copy the two war files that are in <em>openrdf-sesame-2.7.14/war</em> to <em>/var/lib/tomcat7/webapps</em></p> +<p>From <em>openrdf-sesame-2.7.14/war</em> you can do it with command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>cp openrdf-*.war &lt;tomcat_install&gt;/webapps +</span></span></code></pre></div><p>Sesame applications write and store configuration files in a single directory and the tomcat server needs permissions for it.</p> +<p>By default the configuration directory is: <em>/usr/share/tomcat7/.aduna</em></p> +<p>Create the directory:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo mkdir /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Then change the ownership:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chown tomcat7 /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>And finally you should give the necessary permissions:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chmod o+rwx /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Now when you go to: http://&lt;your_ip_address&gt;:8080/openrdf-workbench/repositories</p> +<p>You should get a screen like this:</p> +<p><img src="01-Sesame-repo-list.png" alt="image"></p> +<h3 id="setup-spb">Setup SPB</h3> +<p>You can download the SPB code and find brief documentation on GitHub:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm">https://github.com/ldbc/ldbc_spb_bm</a></p> +<p>A detailed documentation is located here:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf">https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf</a></p> +<p>SPB offers many configuration options which control various features of the benchmark e.g.:</p> +<ul> +<li>query mixes</li> +<li>dataset size</li> +<li>loading 
datasets</li> +<li>number of agents</li> +<li>validating results</li> +<li>test conformance to OWL2-RL ruleset</li> +<li>update rate of agents</li> +</ul> +<p>Here we demonstrate how to generate a dataset and execute a simple test<br> +run with it.</p> +<p>First download the SPB source code from the repository:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>git clone https://github.com/ldbc/ldbc_spb_bm.git +</span></span></code></pre></div><p>Then in the ldbc_spb_bm directory build the project:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>ant build-basic-querymix +</span></span></code></pre></div><p>If you simply execute the command:</p> +<pre tabindex="0"><code>ant +</code></pre><p>you’ll get a list of all available build configurations for the SPB test driver, but for the purpose of this step-by-step guide, configuration shown above is sufficient.</p> +<p>Depending on generated dataset size a bigger java heap size may be required for the Sesame Store. You can change it by adding following arguments to Tomcat&rsquo;s startup files e.g. in <em>catalina.sh</em>:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>export JAVA_OPTS<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;-d64 -Xmx4G&#34;</span> +</span></span></code></pre></div><p>To run the Benchmark you need to create a repository in the Sesame Data Store, similar to the following screenshot:</p> +<p><img src="02-Sesame-create-repo.png" alt="image"></p> +<p>Then we need to point the benchmark test driver to the SPARQL endpoint of that repository. 
This is done in <em>ldbc_spb_bm/dist/test.properties</em> file.</p> +<p>The default value of <em>datasetSize</em> in the properties is set to be 10M, but for the purpose of this guide we will decrease it to 1M.</p> +<p>You need to change</p> +<pre tabindex="0"><code>datasetSize=1000000 +</code></pre><p>Also the URLs of the SPARQL endpoint for the repository</p> +<pre tabindex="0"><code>endpointURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1 +endpointUpdateURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1/statements +</code></pre><p>First step, before measuring the performance of a triple store, is to load the reference-knowledge data, generate a 1M dataset, load it into the repository and finally generate query substitution parameters.</p> +<p>These are the settings to do that, following parameters will &lsquo;instruct&rsquo; the SPB test driver to perform all the actions described above:</p> +<pre tabindex="0"><code>#Benchmark Operational Phases +loadOntologies=true +loadReferenceDatasets=true +generateCreativeWorks=true +loadCreativeWorks=true +generateQuerySubstitutionParameters=true +validateQueryResults=false +warmUp=false +runBenchmark=false +runBenchmarkOnlineReplicationAndBackup=false +checkConformance=false +</code></pre><p>To run the benchmark execute the following:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>java -jar semantic_publishing_benchmark-basic-standard.jar +</span></span><span style="display:flex;"><span>test.properties +</span></span></code></pre></div><p>When the initial run has finished, we should have a 1M dataset loaded into the repository and a set of files with query substitution parameters.</p> +<p>Next we will measure the performance of Sesame Data Store by changing some configuration properties:</p> +<pre tabindex="0"><code>#Benchmark Configuration Parameters +warmupPeriodSeconds=60 +benchmarkRunPeriodSeconds=300 +... +#Benchmark Operational Phases +loadOntologies=false +loadReferenceDatasets=false +generateCreativeWorks=false +loadCreativeWorks=false +generateQuerySubstitutionParameters=false +validateQueryResults=false +warmUp=true +runBenchmark=true +runBenchmarkOnlineReplicationAndBackup=false +checkConformance=false +</code></pre><p>After the benchmark test run has finished result files are saved in folder: <em>dist/logs</em></p> +<p>There you will find three types of results: the result summary of the benchmark run (<em>semantic_publishing_benchmark_results.log),</em> brief results and detailed results.</p> +<p>In <em>semantic_publishing_benchmark_results.log</em> you will find the results distributed per seconds. 
They should be similar to the listing bellow:</p> +<p>Benchmark Results for the 300-th second</p> +<pre tabindex="0"><code>Seconds : 300 (completed query mixes : 0) + Editorial: + 2 agents + + 9 inserts (avg : 22484 ms, min : 115 ms, max : 81389 ms) + 0 updates (avg : 0 ms, min : 0 ms, max : 0 ms) + 0 deletes (avg : 0 ms, min : 0 ms, max : 0 ms) + + 9 operations (9 CW Inserts (0 errors), 0 CW Updates (1 errors), 0 CW Deletions (2 errors)) + 0.0300 average operations per second + + Aggregation: + 8 agents + + 2 Q1 queries (avg : 319 ms, min : 188 ms, max : 451 ms, 0 errors) + 3 Q2 queries (avg : 550 ms, min : 256 ms, max : 937 ms, 0 errors) + 1 Q3 queries (avg : 58380 ms, min : 58380 ms, max : 58380 ms, 0 errors) + 2 Q4 queries (avg : 65250 ms, min : 40024 ms, max : 90476 ms, 0 errors) + 1 Q5 queries (avg : 84220 ms, min : 84220 ms, max : 84220 ms, 0 errors) + 2 Q6 queries (avg : 34620 ms, min : 24499 ms, max : 44741 ms, 0 errors) + 3 Q7 queries (avg : 5892 ms, min : 4410 ms, max : 8528 ms, 0 errors) + 2 Q8 queries (avg : 3537 ms, min : 546 ms, max : 6528 ms, 0 errors) + 4 Q9 queries (avg : 148573 ms, min : 139078 ms, max : 169559 ms, 0 errors) +</code></pre><p>This step-by-step guide gave an introduction on how to setup and run the SPB on a Sesame Data Store. Further details can be found in the reference documentation listed above.</p> +<p>If you have any troubles running the benchmark, don&rsquo;t hesitate to comment or use our social media channels.</p> +<p>In a future post we will go through some of the parameters of SPB and check their performance implications.</p> + + + + + Semantic Publishing Instance Matching Benchmark + https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/ + Tue, 30 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/ + <p>The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.</p> +<p>The SPIMBench test cases provide a systematic way for testing the performance of instance matching systems in different settings. 
SPIMBench supports the types of test cases already adopted by existing instance matching benchmarks:</p> +<ul> +<li>value-based test cases based on applying value transformations (e.g., blank character addition and deletion, change of date format, abbreviations, synonyms) on triples relating to given input entity</li> +<li>structure-based test cases characterized by a structural transformation (e.g., different nesting levels for properties, property splitting, aggregation)</li> +</ul> +<p>The novelty of SPIMBench lies in the support for the following semantics-aware test cases defined on the basis of OWL constructs:</p> +<ul> +<li>instance (in)equality (owl:sameAs, owl:differentFrom)</li> +<li>class and property equivalence (owl:equivalentClass, owl:equivalentProperty)</li> +<li>class and property disjointness (owl:disjointWith, owl:AllDisjointClasses, owl:propertyDisjointWith, owl:AllDisjointProperties)</li> +<li>class and property hierarchies (rdfs:subClassOf, rdfs:subPropertyOf)</li> +<li>property constraints (owl:FunctionalProperty, owl:InverseFunctionalProperty)</li> +<li>complex class definitions (owl:unionOf, owl:intersectionOf)</li> +</ul> +<p>SPIMBench uses and extends the ontologies of LDBC&rsquo;s Semantic Publishing Benchmark (SPB) to tackle the more complex schema constructs expressed in terms of OWL. It also extends SPB&rsquo;s data generator to first generate a synthetic source dataset that does not contain any matches, and then to generate matches and non-matches to entities of the source dataset to address the supported transformations and OWL constructs. The data generation process allows the creation of arbitrary large datasets, thus supporting the evaluation of both the scalability and the matching quality of an instance matching system.</p> +<p>Value and structure-based test cases are implemented using the SWING framework <a href="#references">[1]</a> on data and object type properties respectively. These are produced by applying the appropriate transformation(s) on a source instance to obtain a target instance. Semantics-based test cases are produced in the same way as with the value and structure-based test cases with the difference that appropriate triples are constructed and added in the target dataset to consider the respective OWL constructs.</p> +<p>SPIMBench, in addition to the semantics-based test cases that differentiate it from existing instance matching benchmarks, also offers a weighted gold standard used to judge the quality of answers of instance matching systems. It contains generated matches (a pair consisting of an entity of the source dataset and an entity of the target dataset) the type of test case it represents, the property on which a transformation was applied (in the case of value-based and structure-based test cases), and a weight that quantifies how easy it is to detect this match automatically. SPIMBench adopts an information-theoretical approach by applying multi-relational learning to compute the weight of the pair of matched instances by measuring the information loss that results from applying transformations to the source data to generate the target data. 
This detailed information, which is not provided by state of the art benchmarks, allows users of SPIMBench (e.g., developers of IM systems) to more easily identify the reasons underlying the performance results obtained using SPIMBench and thereby supports the debugging of instance matching systems.</p> +<p>SPIMBench can be downloaded from <a href="https://github.com/jsaveta/SPIMBench">our repository</a> and a more thorough description thereof can be found on <a href="http://www.ics.forth.gr/isl/spimbench/">http://www.ics.forth.gr/isl/spimbench/</a>.</p> +<h4 id="references">References</h4> +<p>[1] A. Ferrara, S. Montanelli, J. Noessner, and H. Stuckenschmidt. Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p> + + + + + Further Developments in SNB BI Workload + https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/ + Thu, 18 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/ + <p>We are presently working on the SNB BI workload. Andrey Gubichev of TU Munchen and myself are going through the queries and are playing with two SQL based implementations, one on Virtuoso and the other on Hyper.</p> +<p>As discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.</p> +<p>There are obvious marketing applications for a SNB-like dataset. There are also security related applications, ranging from fraud detection to intelligence analysis. The latter category is significant but harder to approach, as much of the detail of best practice is itself not in the open. In this post, I will outline some ideas discussed over time that might cristallize into a security related section in the SNB BI workload. We invite comments from practitioners for making the business questions more relevant while protecting sensitive details.</p> +<p>Let’s look at what scenarios would fit with the dataset. We have people, different kinds of connections between people, organizations, places and messages. Messages (posts/replies), people and organizations are geo-tagged. Making a finer level of geo-tagging, with actual GPS coordinates, travel itineraries etc, all referring to real places would make the data even more interesting. The geo dimension will be explored separately in a forthcoming post.</p> +<p>One of the first things to appear when approaching the question isthat the analysis of behavior patterns over time is not easily captured in purely declarative queries. For example, temporal sequence of events and the quantity and quality of interactions between players leads to intractably long queries which are hard to understand and debug. Therefore, views and intermediate materializations become increasingly necessary.</p> +<p>Another feature of the scene is that information is never complete. Even if logs are complete for any particular system, there are always possible interactions outside of the system. Therefore we tend to get match scores more then strictly Boolean conditions. Since everybody is related to everybody else via a relative short path, the nature and stremgth of the relationship is key to interpreting its significance.</p> +<p>Since a query consisting of scores and outer joins only is difficult to interpret and optimize, and since the information is seldom complete, some blanks may have to be filled in by guesses. 
The database must therefore contain metadata about this.</p> +<p>An orthogonal aspect to security applications is the access control of the database itself. One might assume that if a data warehouse of analyzable information is put together, the analyst would have access to the entirety of it. This is however not necessarily the case since the information itself and its provenance may fall under different compartments.</p> +<p>So, let’s see how some of these aspects could be captured in the SNB context.</p> +<p>Geography - We materialize a table of travel events, so that an unbroken sequence of posts from the same location (e.g. country) other than the residence of the poster forms a travel event. The posts may have a fine grained position (IP, GPS coordinates of photos) that marks an itinerary. This is already beyond basicSQL, needing a procedure or window functions.</p> +<p>The communication between people is implicit in reply threads and forum memberships. A reply is the closest that one comes to a person to person message in the dataset. Otherwise all content is posted to forumns with more or less participants. Membership in a high traffic forum with few participants would indicate a strong connection. Calculating these time varying connection strengths is a lot of work and a lot of text in queries. Keeping things simple requires materializing a sparse “adjacency cube,” i.e. a relation of person1, person2, time bucket -&gt; connection strength. In the SNB case the connection strength may be derived from reciprocal replies, likes, being in the same forums, knowing each other etc. Selectivity is important, i.e. being in many small forumns together counts for more than being in ones where everybody else also participates.</p> +<p>The behaviors of people in SNB is not identical from person to person but for the same person follows a preset pattern. Suppose a question like “ which person with access to secrets has a marked change of online behavior?” The change would be starting or stopping communication with a given set of people, for example. Think that the spy meets the future spymaster in a public occasion, has a series of exchanges, travels to an atypical destination, then stops all open contact with the spymaster or related individuals. Patterns like this do not occur in the data but can be introduced easily enough.</p> +<p>In John Le Carre’s A Perfect Spy the main character is caught because it comes to light that his travel routes near always corresponded to his controller’s. This would make a query. This could be cast in marketing terms as a “(un)common shopping basket.”</p> +<p>Analytics becomes prediction when one part of a pattern exists without the expected next stage. Thus the same query template can serve for detecting full or partial instances of a pattern, depending on how the scores are interpreted.</p> +<p>From a database angle, these questions group on an item with internal structure. For the shopping basket this is a set. For the travel routes this is an ordered sequence of space/time points, with a match tolerance on the spatial and temporal elements. Another characteristic is that there is a baseline of expectations and the actual behavior. Both have structure, e.g. the occupation/location/interest/age of one’s social circle. These need to be condensed into a sort of metric space and then changes and rates of change can be observed. Again, this calls for a multidimensional cube to be created as a summary, then algorithms to be applied to this. 
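+</p>
+<p>To make the adjacency cube idea above more concrete, here is a toy Python sketch (our illustration only, with made-up event tuples and weights; in practice such a summary would be materialized and refreshed inside the DBMS) that folds reply events into (person pair, month) cells:</p>
+<pre tabindex="0"><code># Toy sketch: fold reply events into a sparse adjacency cube keyed by
+# (person pair, month), where the cell value approximates connection strength.
+from collections import defaultdict
+from datetime import datetime
+
+# (replier id, original author id, timestamp) of each reply; illustrative data only
+reply_events = [
+    (101, 202, datetime(2012, 3, 14)),
+    (202, 101, datetime(2012, 3, 20)),   # reciprocal reply in the same month
+    (101, 303, datetime(2012, 7, 2)),
+]
+
+cube = defaultdict(float)
+for replier, author, ts in reply_events:
+    bucket = (ts.year, ts.month)                         # one time bucket per month
+    pair = (min(replier, author), max(replier, author))  # undirected person pair
+    cube[(pair, bucket)] += 1.0   # a real score would also weight likes, forum selectivity, etc.
+
+# cube[((101, 202), (2012, 3))] is now 2.0, a comparatively strong tie for March 2012.
+</code></pre>
+<p>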
The declarative BI query a la TPC-H does not easily capture this all.</p> +<p>This leads us to graph analytics in a broader sense. Some of the questions addressed here will still fit in the materialized summaries+declarative queries pattern but the more complex summarization and clustering moves towards iterative algorithms.</p> +<p>There is at present a strong interest in developing graph analytics benchmarks in LDBC. This is an activity that extends beyond the FP7 project duration and beyond the initial partners. To this effect I have implemented some SQL extensions for BSP style processing, as hinted at on my blog. These will be covered in more detail in January, when there are actual experiments.</p> + + + + + Sizing AWS Instances for the Semantic Publishing Benchmark + https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/ + Wed, 17 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/ + <p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the famous <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">BBC Dynamic Semantic Publishing</a> scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volume of read requests (SPARQL queries collecting recent content and data to generate web page on a specific subject, e.g. Frank Lampard). As we <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">wrote earlier</a>, SPB was already successfully used to help developers to identify performance issues and to introduce optimizations in SPARQL engines such as GraphDB and Virtuoso. Now we are at the point to experiment with different sizes of the benchmark and different hardware configurations.</p> +<p>Lately we tested different Amazon Web Services (<a href="https://aws.amazon.com/">AWS</a>) instance types for running SPB basic interactive query mix in parallel with the standard editorial updates – precisely the type of workload that <a href="https://www.ontotext.com/products/ontotext-graphdb/">GraphDB</a> experiences in the backend of BBC Sport website. We discovered and report below a number of practical guidelines about the optimal instance types and configurations. We have proven that SPB 50M workloads can be executed efficiently on a mid-sized AWS instance – c3.2xlarge machine executes 16 read queries and 15 update operations per second. For $1 paid to Amazon for such instance GraphDB executes 140 000 queries and 120 000 updates. 
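+</p>
+<p>These per-dollar figures follow directly from the measured throughput and the hourly instance price; a quick sanity check (using the rounded c3.2xlarge numbers from Table 1 below) reproduces them:</p>
+<pre tabindex="0"><code># Reproduce the queries/USD and updates/USD figures for c3.2xlarge
+# from its measured throughput and hourly on-demand price (see Table 1).
+queries_per_second = 16.46
+updates_per_second = 14.56
+price_usd_per_hour = 0.42
+
+queries_per_usd = queries_per_second * 3600 / price_usd_per_hour
+updates_per_usd = updates_per_second * 3600 / price_usd_per_hour
+
+print(round(queries_per_usd))   # about 141 000 queries per dollar
+print(round(updates_per_usd))   # about 125 000 updates per dollar
+</code></pre>
+<p>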
The most interesting discovery in this experiment is that if BBC were hosting the triplestore behind their Dynamic Semantic Publishing architecture at AWS, the total cost of the server infrastructure behind their Worldcup 2010 website would have been about $80/day.</p> +<h3 id="the-experiment">The Experiment</h3> +<p>For our tests we use:</p> +<ul> +<li>GraphDB Standard v6.1</li> +<li>LDBC-SPB test driver (version 0.1.dc9a626 from 10.Nov.2014) configured as follows: +<ul> +<li>8 aggregation agents (read threads) and 2 editorial agents (write threads); for some configurations we experimented with different numbers of agents also</li> +<li>50M dataset (SF1)</li> +<li>40 minutes of benchmark run time (60 seconds of warm up)</li> +</ul> +</li> +<li>5 different Amazon EC2 instances and one local server</li> +</ul> +<p>Each test run is cold, i.e. data is newly loaded for each run. We set a 5 GByte cache configuration, which is sufficient for the size of the generated dataset. We use the same query substitution parameters (the same randomization seed) for every run, so that we are sure that all test runs are identical.</p> +<p>We use two types of instances – M3 and C3 instances. They both provide SSD storage for fast I/O performance. The M3 instances are with E5-2670v2, 2.50GHz CPU and provide good all-round performance, while the C3 instances are compute optimized with stronger CPU – E5-2680v2, 2.80GHz, but have half as much memory as the M3.</p> +<p>We also use a local physical server with dual-CPU – E5-2650v2, 2.60Ghz; 256GB of RAM and RAID-0 array of SSD in order to provide ground for interpretation of the performance for the virtualized AWS instances. The CPU capacity of the AWS instances is measured in vCPUs (virtual CPU). A vCPU is a logical core – one hyper-thread of one physical core of the corresponding Intel Xeon processor used by Amazon. This means that a vCPU represents roughly half a physical core, even though the performance of a hyper-threaded core is not directly comparable with two non-hyper-threaded cores. We should keep this in mind comparing AWS instances to physical machines, i.e. our local server with two CPUs with 8 physical cores each has 32 logical cores, which is more than c3.4xlarge instance with 16 vCPUs.</p> +<h3 id="the-results">The Results</h3> +<p>For the tests we measured:</p> +<ul> +<li><em>queries/s</em> for the read threads, where queries include SELECT and CONSTRUCT</li> +<li><em>updates/s</em> for the write threads, where an update operation is INSERT or DELETE</li> +<li><em>queries/$</em> and <em>updates/$</em> – respectively queries or updates per dollar is calculated for each AWS instance type based on price and update throughput</li> +<li><em>update/vCPU</em> – modification operations per vCPU per second</li> +</ul> +<p>Results (Table 1.) provide strong evidence that performance depends mostly on processor power. This applies to both queries and updates - which in the current AWS setup go on par with one another. Comparing M3 and C3 instances with equal vCPUs we can see that performance is only slightly higher for the M3 machines and even lower for selects with 8 vCPUs. 
Taking into account the lower price of C3 because of their lower memory, it is clear that C3 machines are better suited for this type of workload and the sweet spot between price and performance is c3.2xlarge machine.</p> +<p>The improvement in performance between the c3.xlarge and c3.2xlarge is more than twofold where the improvement between c3.2xlarge and c3.4xlarge is considerably lower. We also observe slower growth between c3.4xlarge and the local server machine. This is an indication that for SPB at this scale the difference between 7.5GB and 15GB of RAM is substantial, but RAM above this amount cannot be utilized efficiently by GraphDB.</p> +<p>Table 1. SPB Measurement Results on AWS and Local Servers</p> +<table> +<thead> +<tr> +<th>Server Type</th> +<th>vCPUs</th> +<th>R/W Agents</th> +<th>RAM (GB)</th> +<th>&ldquo;Storage (GB, SSD)&rdquo;</th> +<th>Price USD/h</th> +<th>Queries/ sec.</th> +<th>Updates/ sec.</th> +<th>Queries/ USD</th> +<th>Updates/ USD</th> +<th>Updates/ vCPU</th> +</tr> +</thead> +<tbody> +<tr> +<td>m3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>15</td> +<td>2x 40</td> +<td>0.28</td> +<td>8.39</td> +<td>8.23</td> +<td>107 882</td> +<td>105 873</td> +<td>2.06</td> +</tr> +<tr> +<td>m3.2xlarge</td> +<td>8</td> +<td>8/2</td> +<td>30</td> +<td>2x 80</td> +<td>0.56</td> +<td>15.44</td> +<td>15.67</td> +<td>99 282</td> +<td>100 752</td> +<td>1.96</td> +</tr> +<tr> +<td>c3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>7.5</td> +<td>2x 40</td> +<td>0.21</td> +<td>7.17</td> +<td>6.78</td> +<td>122 890</td> +<td>116 292</td> +<td>1.7</td> +</tr> +<tr> +<td><strong>c3.2xlarge</strong></td> +<td><strong>8</strong></td> +<td><strong>8/2</strong></td> +<td><strong>15</strong></td> +<td><strong>2x 80</strong></td> +<td><strong>0.42</strong></td> +<td><strong>16.46</strong></td> +<td><strong>14.56</strong></td> +<td><strong>141 107</strong></td> +<td><strong>124 839</strong></td> +<td><strong>1.82</strong></td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>8/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>23.23</strong></td> +<td><strong>21.17</strong></td> +<td><strong>99 578</strong></td> +<td><strong>90 736</strong></td> +<td><strong>1.32</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>8/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>22.89</td> +<td>20.39</td> +<td>98 100</td> +<td>87 386</td> +<td>1.27</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/2</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.6</td> +<td>19.11</td> +<td>114 000</td> +<td>81 900</td> +<td>1.19</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.19</td> +<td>19.18</td> +<td>112 243</td> +<td>82 200</td> +<td>1.2</td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>14/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>30.84</strong></td> +<td><strong>16.88</strong></td> +<td><strong>132 171</strong></td> +<td><strong>72 343</strong></td> +<td><strong>1.06</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>14/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>29.67</td> +<td>17.8</td> +<td>127 157</td> +<td>76 286</td> +<td>1.11</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>8/2</td> +<td>256</td> +<td>8x 256</td> 
+<td>0.85</td> +<td>37.11</td> +<td>32.04</td> +<td>156 712</td> +<td>135 302</td> +<td>1</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>8/3</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>37.31</td> +<td>32.07</td> +<td>157 557</td> +<td>135 429</td> +<td>1</td> +</tr> +<tr> +<td><strong>Local</strong></td> +<td><strong>32</strong></td> +<td><strong>10/2</strong></td> +<td><strong>256</strong></td> +<td><strong>8x 256</strong></td> +<td><strong>0.85</strong></td> +<td><strong>40</strong></td> +<td><strong>31.01</strong></td> +<td><strong>168 916</strong></td> +<td><strong>130 952</strong></td> +<td><strong>0.97</strong></td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>14/2</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>36.39</td> +<td>26.42</td> +<td>153 672</td> +<td>111 569</td> +<td>0.83</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>14/3</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>36.22</td> +<td>26.39</td> +<td>152 954</td> +<td>111 443</td> +<td>0.82</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>20/2</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>34.59</td> +<td>23.86</td> +<td>146 070</td> +<td>100 759</td> +<td>0.75</td> +</tr> +</tbody> +</table> +<h3 id="the-optimal-number-of-test-agents">The Optimal Number of Test Agents</h3> +<p>Experimenting with different number of aggregation (read) and editorial (write) agents at c3.4xlarge and the local server, we made some interesting observations:</p> +<ul> +<li>There is almost no benefit to use more than 2 write agents. This can be explained by the fact that certain aspects of handling writes in GraphDB are serialized, i.e. they cannot be executed in parallel across multiple write threads;</li> +<li>Using more read agents can have negative impact on update performance. This is proven by the c3.4xlarge results with 8/2 and with 14/2 agents - while in the later case GraphDB handles a bit higher amount of queries (31 vs. 23) we see a drop in the updates rates (from 21 to 17);</li> +<li>Overall, the configuration with 8 read agents and 2 write agents delivers good balanced results across various hardware configurations;</li> +<li>For machines with more than 16 cores, a configuration like 10/2 or 14/2, would maximize the number of selects, still with good update rates. This way one can get 30 queries/sec. on c3.4xlarge and 40 queries/sec. on a local server;</li> +<li>Launching more than 14 read agents does not help even on local server with 32 logical cores. This indicates that at this point we are reaching some constraints such as memory bandwidth or IO throughput and degree of parallelization.</li> +<li>There is some overhead when handling bigger number of agents as the results for the local server tests with 14/3 and 20/2 show the worst results for both queries and updates.</li> +</ul> +<h3 id="efficiency-and-cost">Efficiency and Cost</h3> +<p>AWS instance type c3.2xlarge provides the best price/performance ratio for applications where 15 updates/sec. are sufficient even at peak times. 
More intensive applications should use type c3.4xlarge, which guarantees more than 20 updates/sec.</p> +<p>Cloud infrastructure providers like Amazon, allow one to have a very clear account of the full cost for the server infrastructure, including hardware, hosting, electricity, network, etc.</p> +<p>$1 spent on c3.2xlarge ($0.41/hour) allows for handling 140 000 queries, along with more than 120 000 update operations!</p> +<p>The full cost of the server infrastructure is harder to compute in the case of purchasing a server and hosting it in a proprietary data center. Still, one can estimate the upper limits - for machine, like the local server used in this benchmark, this price is way lower than $1/hour. One should consider that this machine is with 256GB of RAM, which is an overkill for Semantic Publishing Benchmark ran at 50M scale. Under all these assumptions we see that using local server is cheaper than the most cost-efficient AWS instance. This is expected - owning a car is always cheaper than renting it for 3 years in a row. Actually, the fact that the difference of the prices/query in this case are low indicates that using AWS services comes at very low extra cost.</p> +<p>To put these figures in the context of a known real world application, let us model the case of a GraphDB Enterprise replication cluster with 2 master nodes and 6 worker nodes - the size of cluster that BBC used for their FIFA Worldcup 2010 project. Given c3.2xlarge instance type, the math works as follows:</p> +<ul> +<li><strong>100 queries/sec.</strong> handled by the cluster. This means about 360 000 queries per hour or more than 4 million queries per day. This is at least 2 times more than the actual loads of GraphDB at BBC during the peak times of big sports events.</li> +<li><strong>10 updates/sec.</strong> - the speed of updates in GraphDB Enterprise cluster is lower than the speed of each worker node in separation. There are relatively few content management applications that need more than 36 000 updates per hour.</li> +<li><strong>$81/day</strong> is the full cost for the server infrastructure. This indicates an annual operational cost for cluster of this type in the range of $30 000, even without any effort to release some of the worker nodes in non-peak times.</li> +</ul> + + + + + DATAGEN: a Realistic Social Network Data Generator + https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/ + Sat, 06 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/ + <p>In previous posts (<a href="https://ldbcouncil.org/post/getting-started-with-snb">Getting started with snb</a>, <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">DATAGEN: data generation for the Social Network Benchmark</a>), Arnau Prat discussed the main features and characteristics of DATAGEN: <em>realism</em>, <em>scalability</em>, <em>determinism</em>, <em>usability</em>. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity in a social network site during a period of time. In this post, we conduct a series of experiments that will shed some light on how realistic data produced by DATAGEN looks. 
For our testing, we generated a dataset of scale factor 10 (i.e., social network of 73K users during 3 years) and loaded it into Virtuoso by following the <a href="https://github.com/ldbc/ldbc_snb_datagen">instructions for generating a SNB dataset</a> and <a href="https://github.com/ldbc/ldbc_snb_implementations/tree/master/interactive/virtuoso">for loading the dataset into Virtuoso</a>. In the following sections, we analyze several aspects of the generated dataset.</p> +<h3 id="a-realistic-social-graph">A Realistic social graph</h3> +<p>One of the most complexly structured graphs that can be found in the data produced by DATAGEN is the friends graph, formed by people and their <em><knows></em> relationships. We used the R script after Figure 1 to draw the social degree distribution in the SNB friends graph. As shown in Figure 1, the cumulative social degree distribution of the friends graph is similar to that from Facebook (See the note about <a href="https://www.facebook.com/notes/facebook-data-team/anatomy-of-facebook/10150388519243859">Facebook Anatomy</a>). This is not by chance, as DATAGEN has been designed to deliberately reproduce the Facebook&rsquo;s graph distribution.</p> +<p><img src="Cumulative-distribution.png" alt="image"> <br> +Figure 1: Cumulative distribution #friends per user</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-r" data-lang="r"><span style="display:flex;"><span><span style="color:#75715e">#R script for generating the social degree distribution </span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">#Input files: person_knows_person_*.csv</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(data.table) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(igraph) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(plotrix) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">require</span>(bit64) +</span></span><span style="display:flex;"><span>dflist <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">lapply</span>(<span style="color:#a6e22e">commandArgs</span>(trailingOnly <span style="color:#f92672">=</span> <span style="color:#66d9ef">TRUE</span>), fread, sep<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;|&#34;</span>, +</span></span><span style="display:flex;"><span> header<span style="color:#f92672">=</span>T, select<span style="color:#f92672">=</span><span style="color:#ae81ff">1</span><span style="color:#f92672">:</span><span style="color:#ae81ff">2</span>, colClasses<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;integer64&#34;</span>) +</span></span><span style="display:flex;"><span> df <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">rbindlist</span>(dflist) <span style="color:#a6e22e">setNames</span>(df, <span style="color:#a6e22e">c</span>(<span style="color:#e6db74">&#34;P1&#34;</span>, <span style="color:#e6db74">&#34;P2&#34;</span>)) +</span></span><span style="display:flex;"><span>d2 <span style="color:#f92672">&lt;-</span> df[,<span style="color:#a6e22e">length</span>(P2),by<span style="color:#f92672">=</span>P1] +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">pdf</span>(<span 
style="color:#e6db74">&#34;socialdegreedist.pdf&#34;</span>) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">plot</span>(<span style="color:#a6e22e">ecdf</span>(d2<span style="color:#f92672">$</span>V1),main<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Cummulative distribution #friends per user&#34;</span>, +</span></span><span style="display:flex;"><span> xlab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Number of friends&#34;</span>, ylab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Percentage number of users&#34;</span>, log<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;x&#34;</span>, +</span></span><span style="display:flex;"><span> xlim<span style="color:#f92672">=</span><span style="color:#a6e22e">c</span>(<span style="color:#ae81ff">0.8</span>, <span style="color:#a6e22e">max</span>(d2<span style="color:#f92672">$</span>V1) <span style="color:#f92672">+</span> <span style="color:#ae81ff">20</span>)) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">dev.off</span>() +</span></span></code></pre></div><h3 id="data-correlations">Data Correlations</h3> +<p>Data in real life as well as in a real social network is correlated; e.g. names of people living in Germany have a different distribution than those living in Netherlands, people who went to the same university in the same period have a much higher probability to be friends and so on and so forth. In this experiment we will analyze if data produced by DATAGEN also reproduces these phenomena.</p> +<p><em>Which are the most popular names of a country?</em></p> +<p>We run the following query on the database built in Virtuoso, which computes the distribution of the names of the people for a given country. In this query, <em>&lsquo;A_country_name&rsquo;</em> is the name of a particular country such as <em>&lsquo;Germany&rsquo;, &lsquo;Netherlands&rsquo;, or &lsquo;Vietnam&rsquo;</em>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> p_lastname, <span style="color:#66d9ef">count</span> (p_lastname) <span style="color:#66d9ef">as</span> namecnt +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">FROM</span> person, country +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> p_placeid <span style="color:#f92672">=</span> ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;A_country_name&#39;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> p_lastname <span style="color:#66d9ef">order</span> <span style="color:#66d9ef">by</span> namecnt <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we can see from Figures 2, 3, and 4, the distributions of names in Germany, Netherlands and Vietnam are different. A name that is popular in Germany such as <em>Muller</em> is not popular in the Netherlands, and it even does not appear in the names of people in Vietnam. 
We note that the names&rsquo; distribution may not be exactly the same as the contemporary names&rsquo; distribution in these countries, since the names resource files used in DATAGEN are extracted from Dbpedia, which may contain names from different periods of time.</p> +<p><img src="distribution-germany.png" alt="image"> <br> +Figure 2. Distribution of names in Germany</p> +<p><img src="distribution-netherlands.png" alt=""> <br> +Figure 3. Distribution of names in Netherlands</p> +<p><img src="distribution-vietnam.png" alt=""> <br> +Figure 4. Distribution of names in Vietnam</p> +<p><em>Where my friends are living?</em></p> +<p>We run the following query, which computes the locations of the friends of people living in China.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> fctry.ctry_name, <span style="color:#66d9ef">count</span> (<span style="color:#f92672">*</span>) <span style="color:#66d9ef">from</span> person <span style="color:#66d9ef">self</span>, person +</span></span><span style="display:flex;"><span>friend, country pctry, knows, country fctry +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> pctry.ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;China&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> <span style="color:#66d9ef">self</span>.p_placeid <span style="color:#f92672">=</span> pctry.ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> <span style="color:#66d9ef">self</span>.p_personid <span style="color:#66d9ef">and</span> friend.p_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> fctry.ctry_city <span style="color:#f92672">=</span> friend.p_placeid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> fctry.ctry_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As shown in the graph, most of the friends of people living in China are also living in China. The rest comes predominantly from near-by countries such as India, Vietnam.</p> +<p><img src="chinese-friends.png" alt=""> <br> +Figure 5. 
Locations of friends of people in China</p> +<p><em>Where my friends are studying?</em></p> +<p>Finally, we run the following query to find where the friends of people studying at a specific university (e.g., “Hangzhou_International_School”) are studying at.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> o2.o_name, <span style="color:#66d9ef">count</span>(o2.o_name) <span style="color:#66d9ef">from</span> knows, person_university +</span></span><span style="display:flex;"><span>p1, person_university p2, organisation o1, organisation o2 +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> +</span></span><span style="display:flex;"><span> p1.pu_organisationid <span style="color:#f92672">=</span> o1.o_organisationid +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> o1.o_name<span style="color:#f92672">=</span><span style="color:#e6db74">&#39;Hangzhou_International_School&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> p1.pu_personid <span style="color:#66d9ef">and</span> p2.pu_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> p2.pu_organisationid <span style="color:#f92672">=</span> o2.o_organisationid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> o2.o_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we see from Figure 6, most of the friends of the Hangzhou International School students also study at that university. This is a realistic correlation, as people studying at the same university have a much higher probability to be friends. Furthermore, top-10 universities for the friends of the Hangzhou School students’ are from China, while people from foreign universities have small number of friends that study in Hangzhou School (See Table 1).</p> +<p><img src="friends-international-school.png" alt=""> <br> +Figure 6. Top-10 universities where the friends of Hangzhou International School students are studying at.</p> +<table> +<thead> +<tr> +<th>Name</th> +<th># of friends</th> +</tr> +</thead> +<tbody> +<tr> +<td>Hangzhou_International_School</td> +<td>12696</td> +</tr> +<tr> +<td>Anhui_University_of_Science_and_Technology</td> +<td>4071</td> +</tr> +<tr> +<td>China_Jiliang_University</td> +<td>3519</td> +</tr> +<tr> +<td>&hellip;</td> +<td></td> +</tr> +<tr> +<td>Darmstadt_University_of_Applied_Sciences</td> +<td>1</td> +</tr> +<tr> +<td>Calcutta_School_of_Tropical_Medicine</td> +<td>1</td> +</tr> +<tr> +<td>Chettinad_Vidyashram</td> +<td>1</td> +</tr> +<tr> +<td>Women&rsquo;s_College_Shillong</td> +<td>1</td> +</tr> +<tr> +<td>Universitas_Nasional</td> +<td>1</td> +</tr> +</tbody> +</table> +<p>Table 1. Universities where friends of Hangzhou International School students are studying at.</p> +<p>In a real social network, data is riddled with many more correlations; it is a true data mining task to extract these. 
Even though DATAGEN may not be able to model all the real life data correlations, it can generate a dataset that reproduce many of those important characteristics found in a real social network, and additionally introduce a series of plausible correlations in it. More and more interesting data correlations may also be found from playing with the SNB generated data.</p> + + + + + SNB Driver - Part 1 + https://ldbcouncil.org/post/snb-driver-part-1/ + Thu, 27 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-1/ + <p>In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as driver). Software and documentation for this driver is available here: <a href="https://github.com/ldbc/ldbc_driver/">https://github.com/ldbc/ldbc_driver/</a>. Multiple reference implementations by two vendors are available here: <a href="https://github.com/ldbc/ldbc_snb_implementations">https://github.com/ldbc/ldbc_snb_implementations</a>, and discussion of the schema, data properties, and related content is available here: <a href="https://github.com/ldbc/ldbc_snb_docs">https://github.com/ldbc/ldbc_snb_docs</a>.</p> +<p>The following will concentrate on key decisions and techniques that were developed to support scalable, repeatable, distributed workload execution.</p> +<h3 id="problem-description">Problem Description</h3> +<p>The driver generates a stream of operations (e.g. create user, create post, create comment, retrieve person&rsquo;s posts etc.) and then executes them using the provided database connector. To be capable of generating heavier loads, it executes the operations from this stream in parallel. If there were no dependencies between operations (e.g., reads that depend on the completion of writes) this would be trivial. This is the case, for example, for the classical TPC-C benchmark, where splitting transaction stream into parallel clients (terminals) is trivial. However, for LDBC SNB Interactive Workload this is not the case: some operations within the stream do depend on others, others are depended on, some both depend on others and are depended on, and some neither depend on others nor are they depended on.</p> +<p>Consider, for example, a Social Network Benchmark scenario, where the data generator outputs a sequence of events such as User A posted a picture, User B left a comment to the picture of User A, etc. The second event depends on the first one in a sense that there is a causal ordering between them: User B can only leave a comment on the picture once it has been posted. The generated events are already ordered by their time stamp, so in case of the single-threaded execution this ordering is observed by default: the driver issues a request to the SUT with the first event (i.e., User A posts a picture), after its completion it issues the second event (create a comment). However, if events are executed in parallel, these two events may end up in different parallel sequences of events. 
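+</p>
+<p>A small toy sketch (our illustration, not code from the driver) makes the hazard visible:</p>
+<pre tabindex="0"><code># Toy illustration of the ordering hazard (not the LDBC driver implementation).
+# Each operation carries its own timestamp and the timestamp of the operation
+# it depends on (0 means it depends on nothing).
+op_post    = (10, 0)    # User A posts a picture at time 10
+op_comment = (12, 10)   # User B comments at time 12, depending on the post at time 10
+
+stream = [op_post, op_comment]
+
+# A naive round-robin split across two workers separates the dependent events:
+worker_streams = [stream[0::2], stream[1::2]]
+
+# Worker 0 now holds the post and worker 1 the comment; if worker 1 runs ahead,
+# the comment is issued against the SUT before the post it refers to exists.
+</code></pre>
+<p>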
Therefore, a driver needs a mechanism to ensure the dependency is observed even when the dependent events are in different parallel update streams.</p> +<p>The next blog entries in this series will discuss the approaches used in the driver to deal with these challenges.</p> + + + + + Making Semantic Publishing Execution Rules + https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/ + Tue, 18 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/ + <p><a href="https://ldbcouncil.org/">LDBC</a> <a href="https://ldbcouncil.org/benchmarks/spb">SPB (Semantic Publishing Benchmark)</a> is based on the BBC linked data platform use case. Thus the data modelling and transaction mix reflects the BBC&rsquo;s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an <a href="https://www.ontotext.com/products/ontotext-graphdb-owlim/">Ontotext Graph DB</a> deployment. Graph DB was formerly known as Owlim.</p> +<p>So, in SPB we wanted to address substantially more complex queries than the lookups that the BBC linked data platform primarily serves. Diverse dataset summaries, timelines and faceted search qualified by keywords and/or geography are examples of online user experience that SPB needs to cover.</p> +<p>SPB is not per se an analytical workload but we still find that the queries fall broadly in two categories:</p> +<ul> +<li> +<p>Some queries are centred on a particular search or entity. The data touched by the query size does not grow at the same rate as the dataset.</p> +</li> +<li> +<p>Some queries cover whole cross sections of the dataset, e.g. find the most popular tags across the whole database.</p> +</li> +</ul> +<p>These different classes of questions need to be separated in a metric, otherwise the short lookup dominates at small scales and the large query at large scales.</p> +<p>Another guiding factor of SPB was the BBC&rsquo;s and others&rsquo; express wish to cover operational aspects such as online backups, replication and fail-over in a benchmark. True, most online installations have to deal with these things, which are yet as good as absent from present benchmark practice. We will look at these aspects in a different article, for now, I will just discuss the matter of workload mix and metric.</p> +<p>Normally the lookup and analytics workloads are divided into different benchmarks. Here we will try something different. There are three things the benchmark does:</p> +<ul> +<li> +<p>Updates - These sometimes insert a graph, sometimes delete and re-insert the same graph, sometimes just delete a graph. These are logarithmic to data size.</p> +</li> +<li> +<p>Short queries - These are lookups that most often touch on recent data and can drive page impressions. These are roughly logarithmic to data scale.</p> +</li> +<li> +<p>Analytics - These cover a large fraction of the dataset and are roughly linear to data size.</p> +</li> +</ul> +<p>A test sponsor can decide on the query mix within certain bounds. A qualifying run must sustain a minimum, scale-dependent update throughput and must execute a scale-dependent number of analytical query mixes or run for a scale-dependent duration. The minimum update rate, the minimum number of analytics mixes and the minimum duration all grow logarithmically to data size. Within these limits, the test sponsor can decide how to mix the workloads. Publishing several results, emphasizing different aspects is also possible. 
A given system may be specially good at one aspect, leading the test sponsor to accentuate this.</p> +<p>The benchmark has been developed and tested at small scales, between 50 and 150M triples. Next we need to see how it actually scales. There we expect to see how the two query sets behave differently. One effect that we see right away when loading data is that creating the full text index on the literals is in fact the longest running part. For a SF 32 ( 1.6 billion triples) SPB database we have the following space consumption figures:</p> +<ul> +<li> +<p>46886 MB of RDF literal text</p> +</li> +<li> +<p>23924 MB of full text index for RDF literals</p> +</li> +<li> +<p>23598 MB of URI strings</p> +</li> +<li> +<p>21981 MB of quads, stored column-wise with default index scheme</p> +</li> +</ul> +<p>Clearly, applying column-wise compression to the strings is the best move for increasing scalability. The literals are individually short, so literal per literal compression will do little or nothing but applying this by the column is known to get a 2x size reduction with Google Snappy. The full text index does not get much from column store techniques, as it already consists of words followed by space efficient lists of word positions. The above numbers are measured with Virtuoso column store, with quads column wise and the rest row-wise. Each number includes the table(s) and any extra indices associated to them.</p> +<p>Let&rsquo;s now look at a full run at unit scale, i.e. 50M triples.</p> +<p>The run rules stipulate a minimum of 7 updates per second. The updates are comparatively fast, so we set the update rate to 70 updates per second. This is seen not to take too much CPU. We run 2 threads of updates, 20 of short queries and 2 of long queries. The minimum run time for the unit scale is 10 minutes, so we do 10 analytical mixes, as this is expected to take 10 a little over 10 minutes. The run stops by itself when the last of the analytical mixes finishes.</p> +<p>The interactive driver reports:</p> +<pre tabindex="0"><code>Seconds run : 2144 + Editorial: + 2 agents + + 68164 inserts (avg : 46 ms, min : 5 ms, max : 3002 ms) + 8440 updates (avg : 72 ms, min : 15 ms, max : 2471 ms) + 8539 deletes (avg : 37 ms, min : 4 ms, max : 2531 ms) + + 85143 operations (68164 CW Inserts (98 errors), 8440 CW Updates (0 errors), 8539 CW Deletions (0 errors)) + 39.7122 average operations per second + + Aggregation: + 20 agents + + 4120 Q1 queries (avg : 789 ms, min : 197 ms, max : 6767 ms, 0 errors) + 4121 Q2 queries (avg : 85 ms, min : 26 ms, max : 3058 ms, 0 errors) + 4124 Q3 queries (avg : 67 ms, min : 5 ms, max : 3031 ms, 0 errors) + 4118 Q5 queries (avg : 354 ms, min : 3 ms, max : 8172 ms, 0 errors) + 4117 Q8 queries (avg : 975 ms, min : 25 ms, max : 7368 ms, 0 errors) + 4119 Q11 queries (avg : 221 ms, min : 75 ms, max : 3129 ms, 0 errors) + 4122 Q12 queries (avg : 131 ms, min : 45 ms, max : 1130 ms, 0 errors) + 4115 Q17 queries (avg : 5321 ms, min : 35 ms, max : 13144 ms, 0 errors) + 4119 Q18 queries (avg : 987 ms, min : 138 ms, max : 6738 ms, 0 errors) + 4121 Q24 queries (avg : 917 ms, min : 33 ms, max : 3653 ms, 0 errors) + 4122 Q25 queries (avg : 451 ms, min : 70 ms, max : 3695 ms, 0 errors) + + 22.5239 average queries per second. 
Pool 0, queries [ Q1 Q2 Q3 Q5 Q8 Q11 Q12 Q17 Q18 Q24 Q25 ] + + 45318 total retrieval queries (0 timed-out) + 22.5239 average queries per second +</code></pre><p>The analytical driver reports:</p> +<pre tabindex="0"><code>Aggregation: + 2 agents + + 14 Q4 queries (avg : 9984 ms, min : 4832 ms, max : 17957 ms, 0 errors) + 12 Q6 queries (avg : 4173 ms, min : 46 ms, max : 7843 ms, 0 errors) + 13 Q7 queries (avg : 1855 ms, min : 1295 ms, max : 2415 ms, 0 errors) + 13 Q9 queries (avg : 561 ms, min : 446 ms, max : 662 ms, 0 errors) + 14 Q10 queries (avg : 2641 ms, min : 1652 ms, max : 4238 ms, 0 errors) + 12 Q13 queries (avg : 595 ms, min : 373 ms, max : 1167 ms, 0 errors) + 12 Q14 queries (avg : 65362 ms, min : 6127 ms, max : 136346 ms, 2 errors) + 13 Q15 queries (avg : 45737 ms, min : 12698 ms, max : 59935 ms, 0 errors) + 13 Q16 queries (avg : 30939 ms, min : 10224 ms, max : 38161 ms, 0 errors) + 13 Q19 queries (avg : 310 ms, min : 26 ms, max : 1733 ms, 0 errors) + 12 Q20 queries (avg : 13821 ms, min : 11092 ms, max : 15435 ms, 0 errors) + 13 Q21 queries (avg : 36611 ms, min : 14164 ms, max : 70954 ms, 0 errors) + 13 Q22 queries (avg : 42048 ms, min : 7106 ms, max : 74296 ms, 0 errors) + 13 Q23 queries (avg : 48474 ms, min : 18574 ms, max : 93656 ms, 0 errors) + 0.0862 average queries per second. Pool 0, queries [ Q4 Q6 Q7 Q9 Q10 Q13 Q14 Q15 Q16 Q19 Q20 Q21 Q22 Q23 ] + + 180 total retrieval queries (2 timed-out) + 0.0862 average queries per second +</code></pre><p>The metric would be 22.52 qi/s, 310 qa/h, 39.7 u/s @ 50Mt (SF 1)</p> +<p>The SUT is dual Xeon E5-2630, all in memory. The platform utilization is steadily above 2000% CPU (over 20/24 hardware threads busy on the DBMS). The DBMS is Virtuoso open source, (<a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack at github.com</a>, <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics</a>).</p> +<p>The minimum update rate of 7/s was sustained but fell short of the target of 70./s. In this run, most demand was put on the interactive queries. Different thread allocations would give different ratios of the metric components. The analytics mix is for example about 3x faster without other concurrent activity.</p> +<p>Is this good or bad? I would say that this is possible but better can certainly be accomplished.</p> +<p>The initial observation is that Q17 is the worst of the interactive lot. 3x better is easily accomplished by avoiding a basic stupidity. The query does the evil deed of checking for a substring in a URI. This is done in the wrong place and accounts for most of the time. The query is meant to test geo retrieval but ends up doing something quite different. Optimizing this right would almost double the interactive score. There are some timeouts in the analytical run, which as such disqualifies the run. This is not a fully compliant result but is close enough to give an idea of the dynamics. So we see that the experiment is definitely feasible, is reasonably defined and that the dynamics seen make sense.</p> +<p>As an initial comment of the workload mix, I&rsquo;d say that interactive should have a few more very short point lookups to stress compilation times and give a higher absolute score of queries per second.</p> +<p>Adjustments to the mix will depend on what we find out about scaling. 
As with SNB, it is likely that the workload will shift a little, so this result might not be comparable with future ones.</p> +<p>In the next SPB article, we will look closer at performance dynamics and choke points and will have an initial impression on scaling the workload.</p> + + + + + Fifth TUC Meeting + https://ldbcouncil.org/event/fifth-tuc-meeting/ + Fri, 14 Nov 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fifth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce its fifth Technical User<br> +Community (TUC) meeting.</p> +<p>This will be a one-day event at the National Hellenic Research Institute<br> +in Athens, Greece on <strong>Friday November 14, 2014</strong>.</p> +<h3 id="agenda">Agenda</h3> +<p>10:30 - 11:00 Coffee Break</p> +<p>11:00 - 11:10 Peter Boncz (VUA) Welcome &amp; LDBC project status update (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979841.pptx">Presentation</a>)</p> +<p>11:10 - 11:25 Venelin Kotsev (ONTO) Semantic Publishing Benchmark:Short Presentation of SPB and Status</p> +<p>Feedback &amp; Roadmap for SPB &amp; OWLIM (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979839.pdf">Presentation</a>)</p> +<p>11:25 - 11:30 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SPB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979828.pdf">Presentation</a>)</p> +<p>11:30 - 11:45 Alex Averbuch (NEO) Social Network Benchmark: Short Presentation of SNB and Status, Feedback &amp; Roadmap for SNB &amp; Neo4J (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979830.pdf">Presentation</a>)</p> +<p>11:45 - 12:00 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SNB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979829.pdf">Presentation</a>)</p> +<p>12:00 - 12:20 Arnau Prat (UPC) &amp; Andrey Gubichev Status, Feedback &amp; Roadmap for SNB Interactive &amp; Sparksee (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979836.pdf">Presentation</a> ) and Business Intelligence (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979837.pdf">Presentation</a>)</p> +<p>12:20 - 12:40 Tomer Sagi, &ldquo;Experience with SNB and TitanDB at HP&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979838.pptx">Presentation</a> )</p> +<p>12:40 - 13:00 Jakob Nelson, &ldquo;graphbench.org on the SNB datagen&rdquo;</p> +<p>13:00 - 14:30 Lunch Break@Byzantine &amp; Christian Museum (<a href="http://www.byzantinemuseum.gr/en/">link</a>)</p> +<p>14:30 - 14:50 Olaf Hartig, &ldquo;Integrating the Property Graph and RDF data models&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979831.pdf">Presentation</a>)\</p> +<p>Documents: <a href="http://arxiv.org/abs/1409.3288">arxiv/1409.3288</a>, <a href="http://arxiv.org/abs/1406.3399">arxiv/1406.3399</a></p> +<p>14:50 - 15:10 Maria-Esther Vidal and Maribel Acosta, &ldquo;Challenges to be addressed during Benchmarking SPARQL Federated Engines&rdquo; (<a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979842.pdf">Presentation</a>)</p> +<p>15:10 - 15:30 Evaggelia Pitoura, &ldquo;Historical Queries on Graphs&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979835.pdf">Presentation</a>)</p> +<p>15:30 - 16:00 Coffee Break</p> +<p>16:00 - 16:20 Manolis Terrovitis, Giannis Liagos, George Papastefanatos, &ldquo;Efficient Identification of Implicit Facts in Incomplete OWL2-EL Knowledge Bases&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979843.pdf">Presentation</a>)</p> +<p>16:20 - 16:40 Gunes Aluc, &ldquo;WatDiv: How to Tune-up your RDF Data Management System&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979832.pdf">Presentation</a>)</p> +<p>16:40 - 17:00 Giorgos Kollias, Yannis Smaragdakis, &ldquo;Benchmarking @LogicBlox&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979840.pdf">Presentation</a>)</p> +<p>17:00 - 17:15 Hassan Chafi, &ldquo;Oracle Labs Graph Strategy&rdquo;</p> +<p>17:15 - 17:25 Yinglong Xia, &ldquo;Property Graphs for Industry Solution at IBM&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979834.pdf">Presentation</a>)</p> +<p>17:25 - 17:30 Arthur Keen, &ldquo;Short Introduction to SPARQLcity&rdquo;</p> +<p><em><strong>20:30 Dinner @ Konservokouti <a href="https://plus.google.com/114240752029716758955/about?gl=gr&amp;hl=en">(link)</a></strong></em></p> +<p><em><strong>Get a Taxi, and go to Ippokratous 148, Athens, Neapoli Exarheion</strong></em></p> +<h4 id="logistics">Logistics</h4> +<p>The meeting will be held at the <a href="http://www.eie.gr/index-en.html">National Hellenic Research Foundation</a> located in <a href="http://www.eie.gr/location-en.html">downtown Athens</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/5964344.gif" alt=""></p> +<h4 id="travel">Travel</h4> +<p>Athens, Greece&rsquo;s capital city, is easily accessible by air. Travelers on flights to Athens will land at Athens Eleftherios Venizelos International Airport.</p> +<p>To arrive in the city center, you can take the metro from the airport (Line #3) and stop at either stop Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations. You can also take express Bus X95 and stop again at either Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations (the latter is the terminus for the bus).</p> +<p>You can also take a taxi from the airport that runs on a fixed price for the city center (45 euros). More information on how to move around in Athens from the airport can be found here: <a href="http://www.aia.gr/traveler/">http://www.aia.gr/traveler/</a></p> + + + + + Getting Started With the Semantic Publishing Benchmark + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + Sun, 09 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + <p>The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. 
It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies proposed by the BBC that define numerous properties for content; they contain all RDFS schema constructs and certain OWL ones.</p>
+<p>The benchmark proposes a data generator that uses the ontologies provided by the BBC and reference datasets (again provided by the BBC) to produce a set of valid instances; it works with a predefined set of distributions derived from the reference datasets. In addition to these distributions, the data generator also models:</p>
+<ul>
+<li>clustering of creative works around certain entities from the reference datasets (e.g. the association of an entity with creative works would decay exponentially in time)</li>
+<li>correlations between entities - for a certain period in time there will be creative works about two entities, so that a history of interactions is also modelled (e.g. J. Biden and B. Obama are tagged in creative works for a continuous period in time)</li>
+</ul>
+<p>The driver proposed by the benchmark measures the performance of CRUD operations of a SPARQL endpoint by starting a number of concurrently running editorial and aggregation agents. The former execute a series of insert, update and delete operations, whereas the latter execute a set of construct, describe, and select queries on a SPARQL endpoint. The benchmark can access all SPARQL endpoints that support the SPARQL 1.1 protocol. Tests have been run on OWLIM and Virtuoso. Attempts were also made with Stardog.</p>
+<p>Currently, the benchmark offers two workloads; the base version consists of a mix of nine queries of different complexity that cover nearly all the features of the SPARQL 1.1 query language, including sorting, subqueries, limit, regular expressions and grouping.
The queries aim at checking different choke points relevant to query optimisation such as:</p> +<ul> +<li>join ordering based on cardinality constraints - expressed by the different kinds of properties defined in the schema</li> +<li>subselects that aggregate the query results that the optimiser should recognise and evaluate first</li> +<li>optional and nested optional clauses where the optimiser is called to produce a plan where the execution of the optional triple patterns is performed last</li> +<li>reasoning along the RDFS constructs (subclass, subproperty hierarchies, functional, object and transitive properties etc.)</li> +<li>unions to be executed in parallel</li> +<li>optionals that contain filter expressions that should be executed as early as possible in order to eliminate intermediate results</li> +<li>ordering where the optimiser could consider the possibility to choose query plan(s) that facilitate the ordering of results</li> +<li>handling of geo-spatial predicates</li> +<li>full-text search optimisation</li> +<li>asynchronous execution of the aggregate sub-queries</li> +<li>use of distinct to choose the optimal query plan</li> +</ul> +<p>We give below Query 1 of the Semantic Publishing Benchmark.</p> +<pre tabindex="0"><code>PREFIX bbcevent:&lt;http://www.bbc.co.uk/ontologies/event/&gt; +PREFIX geo-pos:&lt;http://www.w3.org/2003/01/geo/wgs84_pos#&gt; +PREFIX bbc:&lt;http://www.bbc.co.uk/ontologies/bbc/&gt; +PREFIX time:&lt;http://www.w3.org/2006/time#&gt; +PREFIX event:&lt;http://purl.org/NET/c4dm/event.owl#&gt; +PREFIX music-ont:&lt;http://purl.org/ontology/mo/&gt; +PREFIX rdf:&lt;http://www.w3.org/1999/02/22-rdf-syntax-ns#&gt; +PREFIX foaf:&lt;http://xmlns.com/foaf/0.1/&gt; +PREFIX provenance:&lt;http://www.bbc.co.uk/ontologies/provenance/&gt; +PREFIX owl:&lt;http://www.w3.org/2002/07/owl#&gt; +PREFIX cms:&lt;http://www.bbc.co.uk/ontologies/cms/&gt; +PREFIX news:&lt;http://www.bbc.co.uk/ontologies/news/&gt; +PREFIX cnews:&lt;http://www.bbc.co.uk/ontologies/news/cnews/&gt; +PREFIX cconcepts:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX dbp-prop:&lt;http://dbpedia.org/property/&gt; +PREFIX geonames:&lt;http://sws.geonames.org/&gt; +PREFIX rdfs:&lt;http://www.w3.org/2000/01/rdf-schema#&gt; +PREFIX domain:&lt;http://www.bbc.co.uk/ontologies/domain/&gt; +PREFIX dbpedia:&lt;http://dbpedia.org/resource/&gt; +PREFIX geo-ont:&lt;http://www.geonames.org/ontology#&gt; +PREFIX bbc-pont:&lt;http://purl.org/ontology/po/&gt; +PREFIX tagging:&lt;http://www.bbc.co.uk/ontologies/tagging/&gt; +PREFIX sport:&lt;http://www.bbc.co.uk/ontologies/sport/&gt; +PREFIX skosCore:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX dbp-ont:&lt;http://dbpedia.org/ontology/&gt; +PREFIX xsd:&lt;http://www.w3.org/2001/XMLSchema#&gt; +PREFIX core:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX curric:&lt;http://www.bbc.co.uk/ontologies/curriculum/&gt; +PREFIX skos:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX cwork:&lt;http://www.bbc.co.uk/ontologies/creativework/&gt; +PREFIX fb:&lt;http://rdf.freebase.com/ns/&gt; + +# Query Name : query1 +# Query Description : +# Retrieve creative works about thing t (or that mention t) +# reasoning: rdfs:subClassOf, rdf:type +# join ordering: cwork:dateModified rdf:type owl:FunctionalProperty +# join ordering: cwork:dateCreated rdf:type owl:FunctionalProperty +# Choke Points : +# - join ordering based on cardinality of functional proerties cwork:dateCreated, cwork:dateModified +# Optimizer should use an efficient cost evaluation method 
for choosing the optimal join tree +# - A sub-select which aggregates results. Optimizer should recognize it and execute it first +# - OPTIONAL and nested OPTIONAL clauses (treated by query optimizer as nested sub-queries) +# Optimizer should decide to put optional triples on top of the join tree +# (i.e. delay their execution to the last possible moment) because OPTIONALs are treated as a left join +# - qiery optimizer has the chance to recognize the triple pattern : ?cWork a ?type . ?type rdfs:subClassOf cwork:CreativeWork +# and eliminate first triple (?cwork a ?type .) since ?cwork is a cwork:CreativeWork​ + +CONSTRUCT { + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:shortTitle ?shortTitle ; + cwork:about ?about ; + cwork:mentions ?mentions ; + cwork:dateCreated ?created ; + cwork:dateModified ?modified ; + cwork:description ?description ; + cwork:primaryFormat ?primaryFormat ; + bbc:primaryContentOf ?webDocument . + ?webDocument bbc:webDocumentType ?webDocType . + ?about rdfs:label ?aboutLabel ; + bbc:shortLabel ?aboutShortLabel ; + bbc:preferredLabel ?aboutPreferredLabel . + ?mentions rdfs:label ?mentionsLabel ; + bbc:shortLabel ?mentionsShortLabel ; + bbc:preferredLabel ?mentionsPreferredLabel . + ?creativeWork cwork:thumbnail ?thumbnail . + ?thumbnail a cwork:Thumbnail ; + cwork:altText ?thumbnailAltText ; + cwork:thumbnailType ?thumbnailType . +} +WHERE { + { + SELECT ?creativeWork + WHERE { + ?creativeWork {{{cwAboutOrMentions}}} {{{cwAboutOrMentionsUri}}} . + ?creativeWork a cwork:CreativeWork ; + cwork:dateModified ?modified . + } + ORDER BY DESC(?modified) + LIMIT 10 + } + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:dateModified ?modified . + OPTIONAL { ?creativeWork cwork:shortTitle ?shortTitle . } + OPTIONAL { ?creativeWork cwork:description ?description . } + OPTIONAL { ?creativeWork cwork:about ?about . + OPTIONAL { ?about rdfs:label ?aboutLabel . } + OPTIONAL { ?about bbc:shortLabel ?aboutShortLabel . } + OPTIONAL { ?about bbc:preferredLabel ?aboutPreferredLabel . } + } + OPTIONAL { + ?creativeWork cwork:mentions ?mentions . + OPTIONAL { ?mentions rdfs:label ?mentionsLabel . } + OPTIONAL { ?mentions bbc:shortLabel ?mentionsShortLabel . } + OPTIONAL { ?mentions bbc:preferredLabel ?mentionsPreferredLabel . } + } + OPTIONAL { ?creativeWork cwork:dateCreated ?created . } + OPTIONAL { ?creativeWork cwork:primaryFormat ?primaryFormat . } + OPTIONAL { ?webDocument bbc:primaryContent ?creativeWork . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork bbc:primaryContentOf ?webDocument . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork cwork:thumbnail ?thumbnail . + OPTIONAL { ?thumbnail cwork:altText ?thumbnailAltText . } + OPTIONAL { ?thumbnail cwork:thumbnailType ?thumbnailType . } + } +} +</code></pre><p>Listing 1. Semantic Publishing Benchmark: Query 1</p> +<p>The benchmark test driver is distributed as a jar file, but can also be built using an ant script. It is distributed with the BBC ontologies and reference datasets, the queries and update workloads discussed earlier and the configuration parameters for running the benchmark and for generating the data. 
It is organised in the following different phases: ontology loading and reference dataset loading, dataset generation and loading, warm up (where a series of aggregation queries are run for a predefined amount of time), benchmark where all queries (aggregation and editorial) are run, conformance checking (that allows one to check whether the employed RDF engine implements OWL reasoning) and finally cleanup that removes all the data from the repository. The benchmark provides a certain degree of freedom where each phase can run independently of the others.</p> +<p>The data generator uses an RDF repository to load ontologies and reference datasets; actually, any system that will be benchmarked should have those ontologies loaded. Any repository that will be used for the data generation should be set up with context indexing, and finally geo-spatial indexing, if available, to serve the spatial queries. The current version of the benchmark has been tested with Virtuoso and OWLIM.</p> +<p>The generator uses configuration files that must be configured appropriately to set the values regarding the dataset size to produce, the number of aggregation and editorial agents, the query time out etc. The distributions used by the data generator could also be edited. The benchmark is very simple to run (once the RDF repository used to store the ontologies and the reference datasets is set up, and the configuration files updated appropriately) using the command: java -jar semantic_publishing_benchmark-*.jar test.properties. The benchmark produces three kinds of files that contain (a) brief information about each executed query, the size of the returned result, and the execution time (semantic_publishing_benchmark_queries_brief.log), (b) the detailed log of each executed query and its result (semantic_publishing_benchmark_queries_detailed.log) (c) the benchmark results (semantic_publishing_benchmark_results.log ).</p> +<p>Below we give an example of a run of the benchmark for OWLIM-SE. The benchmark reports the number of edit operations (inserts, updates, and writes) and queries executed at the Nth second of a benchmark run. It also reports that total number of retrieval queries as well as the average number of queries executed per second.</p> +<pre tabindex="0"><code>Seconds run : 600 + Editorial: + 0 agents + + 0 operations (0 CW Inserts, 0 CW Updates, 0 CW Deletions) + 0.0000 average operations per second + + Aggregation: + 8 agents + + 298 Q1 queries + 267 Q2 queries + 243 Q3 queries + 291 Q4 queries + 320 Q5 queries + 286 Q6 queries + 255 Q7 queries + 274 Q8 queries + 271 Q9 queries + + 2505 total retrieval queries + 4.1750 average queries per second +</code></pre><p>Listing 2. A snippet of semantic_publishing_benchmark_results.log</p> +<p>We run the benchmark under the following configuration: we used 8 aggregation agents for query execution and 4 data generator workers all running in parallel. The warm up period is 120 seconds during which a number of aggregation agents is executed to prepare the tested systems for query execution. Aggregation agents run for a period of 600 seconds, and queries timeout after 90 seconds. We used 10 sets of substitution parameters for each query. For data generation, ontologies and reference datasets are loaded in the OWLIM-SE repository. We used OWLIM-SE, Version 5.4.6287 with Sesame Version 2.6 and Tomcat Version 6. 
The results we obtained for the 10M, 100M and 1B triple datasets are given in the table below (the average number of queries per second is computed over the 600-second run):</p>
+<table>
+<thead>
+<tr>
+<th>#triples</th>
+<th>Q1</th>
+<th>Q2</th>
+<th>Q3</th>
+<th>Q4</th>
+<th>Q5</th>
+<th>Q6</th>
+<th>Q7</th>
+<th>Q8</th>
+<th>Q9</th>
+<th>#queries</th>
+<th>avg. #q. per sec.</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10M</td>
+<td>298</td>
+<td>267</td>
+<td>243</td>
+<td>291</td>
+<td>320</td>
+<td>286</td>
+<td>255</td>
+<td>274</td>
+<td>271</td>
+<td>2505</td>
+<td>4.1750</td>
+</tr>
+<tr>
+<td>100M</td>
+<td>53</td>
+<td>62</td>
+<td>51</td>
+<td>52</td>
+<td>44</td>
+<td>62</td>
+<td>25</td>
+<td>55</td>
+<td>45</td>
+<td>449</td>
+<td>0.7483</td>
+</tr>
+<tr>
+<td>1B</td>
+<td>34</td>
+<td>29</td>
+<td>22</td>
+<td>24</td>
+<td>25</td>
+<td>29</td>
+<td>0</td>
+<td>29</td>
+<td>28</td>
+<td>220</td>
+<td>0.3667</td>
+</tr>
+</tbody>
+</table> + + + + + Choke Point Based Benchmark Design + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + <p>The mission of the <em>Linked Data Benchmark Council</em> (LDBC) is to design and maintain benchmarks for graph data management systems, to establish and enforce standards for running these benchmarks, and to publish and arbitrate the official benchmark results. The council and its <a href="https://ldbcouncil.org">https://ldbcouncil.org</a> website just launched, and in its first 1.5 years of existence, most effort at LDBC has gone into investigating the needs of the field through interaction with the LDBC Technical User Community (<a href="https://ldbcouncil.org/event/fifth-tuc-meeting">next TUC meeting</a> will be on October 5 in Athens) and indeed in <em>designing benchmarks</em>.</p>
+<p>So, what makes a good benchmark design? Many talented people have paved our way in addressing this question, and for relational database systems specifically the benchmarks produced by <a href="http://www.tpc.org/">TPC</a> have been very helpful in maturing relational database technology and making it successful. Good benchmarks are <em>relevant</em> and <em>representative</em> (address important challenges encountered in practice), <em>understandable</em>, <em>economical</em> (implementable on simple hardware), <em>fair</em> (such as not to favor a particular product or approach), <em>scalable</em>, <em>accepted</em> by the community and <em>public</em> (e.g. all of its software is available in open source). This list stems from Jim Gray&rsquo;s <a href="http://research.microsoft.com/en-us/um/people/gray/BenchmarkHandbook/TOC.htm">Benchmark Handbook</a>. In this blogpost, I will share some thoughts on each of these aspects of good benchmark design.</p>
+<p>A very important aspect of benchmark development is making sure that the community <em>accepts</em> a certain benchmark, and starts using it. A benchmark without published results, and therefore without the opportunity to compare results, remains irrelevant. A European FP7 project is a good place to start gathering a critical mass of support (and consensus, in the process) for a new benchmark from the core group of benchmark designers in the joint work performed by the consortium. Since in LDBC multiple commercial graph and RDF vendors are at the table (Neo Technologies, Openlink, Ontotext and Sparsity), a minimal consensus on <strong>fairness</strong> had to be established immediately.
The Linked Data Benchmark Council itself is a noncommercial, neutral entity which releases all its benchmark specifications and software, as well as many materials created during the design. LDBC has spent a lot of time engaging interested parties (mainly through its <a href="https://ldbcouncil.org/tags/tuc-meeting/">Technical User Community gatherings</a>) as well as lining up additional organizations as members of the Linked Data Benchmark Council. There is, in other words, a strong non-technical, human factor in getting benchmarks accepted.</p>
+<p>The need for <em>understandability</em> for me means that a database benchmark should consist of a limited number of queries and result metrics. Hence I find TPC-H with its 22 queries more understandable than TPC-DS with its 99, because after (quite some) study and experience it is possible to understand the underlying challenges of all queries in TPC-H. It may also be possible for TPC-DS, but the amount of effort is just much larger. Understandable also means for me that a particular query should behave similarly, regardless of the query parameters. Often, a particular query needs to be executed many times, and in order not to play into the hands of simple query caching and also to enlarge the access footprint of the workload, different query parameters should be used. However, parameters can strongly change the nature of a query, which is not desirable for the understandability of the workload. For instance, we know that TPC-H Q01 tests raw computation power, as its selection predicate eliminates almost nothing from the main fact table (LINEITEM), which it scans and aggregates into a small 4-tuple result. Using a selection parameter that would select only 0.1% of the data instead would seriously change the nature of Q01, e.g. making it amenable to indexing. This stability of parameter bindings is an interesting challenge for the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) of LDBC, which is not as uniform and uncorrelated as TPC-H. Addressing the challenge of obtaining parameter bindings that have similar execution characteristics will be the topic of a future blog post.</p>
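+<p>To illustrate the idea of stable parameter bindings (this is <em>not</em> the parameter curation method used by LDBC, just a naive sketch with invented names and numbers), one can rank the candidate parameter values by a proxy for the amount of data a query instance will touch and keep only a narrow band around the median, so that every generated query instance does a comparable amount of work:</p>
+<pre tabindex="0"><code>import java.util.ArrayList;
+import java.util.Comparator;
+import java.util.List;
+
+public class StableBindingsSketch {
+
+    // A candidate binding: a person id plus a proxy for the work a query on it will do.
+    static class Candidate {
+        final long personId;
+        final int friendCount;
+        Candidate(long personId, int friendCount) { this.personId = personId; this.friendCount = friendCount; }
+    }
+
+    // Keep n candidates clustered around the median friend count, so that query
+    // instances generated from them touch a similar amount of data.
+    static List&lt;Candidate&gt; pickStableBindings(List&lt;Candidate&gt; candidates, int n) {
+        List&lt;Candidate&gt; sorted = new ArrayList&lt;&gt;(candidates);
+        sorted.sort(Comparator.comparingInt(c -&gt; c.friendCount));
+        int mid = sorted.size() / 2;
+        int from = Math.max(0, mid - n / 2);
+        int to = Math.min(sorted.size(), from + n);
+        return sorted.subList(from, to);
+    }
+
+    public static void main(String[] args) {
+        List&lt;Candidate&gt; candidates = new ArrayList&lt;&gt;();
+        for (long id = 0; id &lt; 1000; id++) {
+            // A skewed degree distribution, as found in a social graph.
+            int friends = (int) Math.pow((id % 100) + 1, 2);
+            candidates.add(new Candidate(id, friends));
+        }
+        for (Candidate c : pickStableBindings(candidates, 5)) {
+            System.out.println("person " + c.personId + " with " + c.friendCount + " friends");
+        }
+    }
+}
+</code></pre>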
+<p>The <em>economical</em> aspect of benchmarking means that while rewarding high-end benchmark runs with higher scores, it is valuable if a meaningful run can also be done with small hardware. For this reason, it is good practice to use a performance-per-EURO (or $) metric, so that small installations, despite a lower absolute score, can still do well on that metric. The economical aspect is right now hurting the (still) leading relational OLTP benchmark TPC-C. Its implementation rules are such that for higher reported rates of throughput, a higher number of warehouses (i.e. larger data size) is needed. In the current day and age of JIT-compiled machine-code SQL procedures and CPU-cache-optimized main-memory databases, the OLTP throughput numbers now obtainable on modern transactional systems like Hyper on even a single server (it reaches more than 100,000 transactions per second) are so high that they lead to petabyte storage requirements. Not only does this make TPC-C very expensive to run, just by the sheer amount of hardware needed according to the rules, but it also undermines its representativity, since OLTP data sizes encountered in the field are much smaller than OLAP data sizes and do not run in the petabytes.</p>
+<p><em>Representative</em> benchmarks can be designed by studying or even directly using real workload information, e.g. query logs. A rigorous example of this is the <a href="http://aksw.org/Projects/DBPSB.html">DBpedia benchmark</a> whose workload is based on the query logs of dbpedia.org. However, this SPARQL endpoint is a single public Virtuoso instance that has been configured to interrupt all long-running queries, so as to ensure the service remains responsive to as many users as possible. As a result, it is only practical to run small lookup queries on this database service, so the query log contained solely such light queries. As a consequence, the DBpedia benchmark only tests small SPARQL queries that stress simple B-tree lookups only (and not joins, aggregations, path expressions or inference) and poses almost no technical challenges for either query optimization or execution. The lesson, thus, is to balance representativity with relevance (see later).</p>
+<p>The fact that a benchmark can be <em>scaled</em> in size favors the use of synthetic data (i.e. created by a data generator) because data generators can produce any desired quantity of data. I hereby note that in this day and age, data generators should be parallel. Single-threaded single-machine data generation just becomes unbearable even at terabyte scales. A criticism of synthetic data is that it may not be representative of real data, which e.g. tends to contain highly correlated data with skewed distributions. This may be addressed to a certain extent by injecting specific skew and correlations into synthetic data as well (but: which skew and which correlations?). An alternative is to use real data and somehow blow up or contract the data. This is the approach in the mentioned DBpedia benchmark, though such scaling will distort the original distributions and correlations. Scaling a benchmark is very useful to investigate the effect of data size on the metric, on individual queries, or even in micro-benchmark tests that are not part of the official query set. Typically OLTP database benchmarks have queries whose complexity is O(log(N)) of the data size N, whereas OLAP benchmarks have queries which are linear, O(N) or at most O(N.log(N)) &ndash; otherwise executing the benchmark on large instances is infeasible. OLTP queries thus typically touch little data, in the order of log(N) tuples. In order not to measure fully cold query performance, OLTP benchmarks for that reason need a warmup phase with O(N/log(N)) queries in order to get the system into a representative state.</p>
+<p>Now, what makes a benchmark <em>relevant</em>? In LDBC we think that benchmarks should be designed such that crucial areas of functionality are highlighted, and in turn system architects are stimulated to innovate: either to catch up with competitors and bring performance and functionality in line with the state of the art, or to innovate and address technical challenges for which no good solutions exist yet, but which can give a decisive performance advantage in the benchmark. Inversely stated, benchmark design can thus be a powerful tool to influence the industry, as a benchmark design may set the agendas for multiple commercial design teams and database architects around the globe. To structure this design process, LDBC introduces the notion of <em>&ldquo;choke points&rdquo;</em>: by which we mean problems that challenge current technology. These choke points are collected and described early in the LDBC design process, and the workloads developed later are scored in terms of their coverage of relevant choke points.
In the case of graph data querying, one of the choke points that is unique to the area is recursive Top-N query handling (e.g. shortest path queries). Another choke point that arises is the impact of correlations between attribute values of graph nodes (e.g. both employed by TUM) and the connectivity degree between nodes (the probability to be friends). The pattern observed in practice is that people who are direct colleagues are often in each other&rsquo;s friend network. A query that selects people in a social graph that work for the same company, and then does a friendship traversal, may get bad intermediate result size estimates and therefore a suboptimal query plan, if optimizers remain unaware of value/structure correlations. So this is an area of functionality that the Social Network Benchmark (SNB) by LDBC will test.</p>
+<p>To illustrate what choke points are in more depth, we wrote a <a href="https://ldbcouncil.org/docs/papers/tpc-h-analyzed-choke-points-tpctc2013.pdf">paper in the TPCTC 2013</a> conference that performs a post-mortem analysis of TPC-H and identifies 28 such choke points. <em><a href="chokepoints.png">This table</a></em> lists them all, grouped into six Choke Point (CP) areas (CP1 Aggregation, CP2 Join, CP3 Locality, CP4 Calculations, CP5 Subqueries and CP6 Parallelism). The classification also shows CP coverage over each of the 22 TPC-H queries (black is high impact, white is no impact).</p>
+<p>I would recommend reading this paper to anyone who is interested in improving the TPC-H score of a relational database system, since this paper contains the collected experience of three database architects who have worked with TPC-H at length: Orri Erling (of Virtuoso), Thomas Neumann (Hyper, RDF-3X), and me (MonetDB, Vectorwise). Recently Orri Erling showed that this paper is not complete, as he discovered one more choke-point area for TPC-H: Top-N pushdown. In a detailed blog entry, Orri shows how this technique can <a href="http://www.openlinksw.com/weblog/oerling/?id=1779">trivialize Q18</a>; this optimization can single-handedly improve the overall TPC-H score by 10-15%. This is also a lesson for LDBC: even though we design benchmarks with choke points in mind, the queries themselves may bring to light unforeseen opportunities and choke points that may give rise to yet unknown innovations.</p>
+<p>LDBC has just published two benchmarks as Public Drafts, which essentially means that you are cordially invited to download and try out the RDF-focused Semantic Publishing Benchmark <a href="https://ldbcouncil.org/developer/spb">(SPB)</a> and the more graph-focused Social Network Benchmark (<a href="https://ldbcouncil.org/developer/snb">SNB</a>), and <a href="https://groups.google.com/forum/#!forum/ldbcouncil">tell us what you think</a>.
Stay tuned for the coming detailed blog posts about these benchmarks, which will explain the graph and RDF processing choke points that they test.</p>
+<p><em>(for more posts from Peter Boncz, see also <a href="https://databasearchitects.blogspot.com">Database Architects</a>, a blog about data management challenges and techniques written by people who design and implement database systems)</em></p> + + + + + New Website Online LDBC Benchmarks Reach Public Draft + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + <p>The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23 2014, in announcing that two of the benchmarks that it has been developing for 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In the case of LDBC, the release is staged: for now, the benchmark software runs read-only queries only. This will be expanded in a few weeks with a mix of read and insert queries. Also, query validation will be added later. Watch this blog for the announcements to come, as this will be a matter of weeks to add.</p>
+<p>The Public Draft stage means that the initial software (data generator, query driver) works and an initial technical specification and documentation has been written. In other words, there is a testable version of the benchmark available for anyone who is interested. Public Draft status does not mean that the benchmarks have been adopted yet; rather, it means that LDBC has come closer to adopting them, but is now soliciting feedback from users. The benchmarks will remain in this stage at least until October 6. On that date, LDBC is organizing its fifth <a href="https://ldbcouncil.org/event/fifth-tuc-meeting">Technical User Community meeting</a>. One of the themes for that meeting is collecting user feedback on the Public Drafts; this input will be used either to further evolve the benchmarks or to adopt them.</p>
+<p>You can also see that we created this new website and a new logo. This website is different from <code>http://ldbc.eu</code>, which describes the EU project that kick-starts LDBC. The ldbcouncil.org site is maintained by the Linked Data Benchmark Council legal entity, which will live on after the EU project stops (in less than a year). The Linked Data Benchmark Council is an independent, impartial, member-sustained organization dedicated to the creation of RDF and graph data management benchmarks and benchmark practices.</p>
+<p>In the coming weeks, you will see many contributors in LDBC post items on this blog. Some of these blog entries will be very technical, others not, but all aim to explain what LDBC is doing for RDF and graph benchmarking, and why.</p> + + + + + Social Network Benchmark Goals + https://ldbcouncil.org/post/social-network-benchmark-goals/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/social-network-benchmark-goals/ + <p>Social Network interaction is amongst the most natural and widespread activities in the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, Social Networks are well understood from the point of view of the data involved and the interaction required by their actors.
Thus, the concepts of friends of friends or retweets are well established for the data attributes they represent, and queries such as “find the friend of a specified person who has long worked in a company in a specified country” are natural for the users and easy to understand from a functional point of view.</p>
+<p>From a totally different perspective, Social Networks are challenging technologically, being part of the Big Data arena, and require the execution of queries that involve complex relationship search and data traversal computations that turn out to be choke points for the data management solutions in the market.</p>
+<p>With the objective of shaping a benchmark whose use case is up to date, well understood by everybody, and which poses significant technological challenges, the LDBC consortium decided to create the Social Network Benchmark, <a href="https://ldbcouncil.org/benchmarks/snb">SNB</a>, which is eventually going to include three workloads: the Interactive, the Business Intelligence and the Analytical. Those workloads are going to share a single synthetic data generation tool that will mimic the data managed by real Social Networks.</p>
+<p>The SNB data generator created by LDBC is an evolution of the S3G2 data generator and can be found at the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">LDBC Github repository</a>. The data generator is unique because it generates data that contains realistic distributions and correlations among variables that were not taken into consideration before. It also allows generating large datasets because it uses a Hadoop-based implementation to compute the complex data generated. The SNB data generator has already been used in different situations, like the <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD programming contest 2014</a>.</p>
+<p>The SNB presents the Interactive workload as the first of the three, with the objective of resembling the queries that users may issue against a Social Network portal. Those are a combination of small read and write queries that express the needs of a user who is interacting with her friends and connections through the Social Network. Queries like the one explained above (Q12 in the workload) are examples that exercise choke points such as pattern recognition or full traversals.</p>
+<p>More details will be given in blog posts to follow, both for the data generator and for the specific characteristics of the workloads, allowing users to gain a first contact with the benchmarks.</p> + + + + + Welcome to the New Industry Oriented LDBC Organisation for Benchmarking RDF and Graph Technologies + https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/ + <p>It is with great pleasure that we announce the new LDBC organisation site at <a href="https://www.ldbcouncil.org">www.ldbcouncil.org</a>. The LDBC started as a European Community FP7-funded project with the objective to create and foster benchmarks, and to become an industry reference for benchmarking RDF and Graph technologies.
A period of more than one and a half years has led us to the creation of the first two workloads, the Semantic Publishing Benchmark and the Interactive workload of the Social Network Benchmark, which you will find in the <em>benchmarks</em> menu on this site.</p>
+<p>Those benchmarks will allow all the actors in the RDF and Graph industry to know who is who and how the different technology players are responding to the results of their competitors. Thus, users will have results with which to compare the technologies, and vendors will have a clear idea of how their products evolve compared to those of other vendors, all with the objective of fostering the technological growth of the RDF and Graph arena.</p>
+<p>While the main objective of LDBC is to create benchmarks, we know that we need a strong community to grow and evolve those benchmarks, taking into consideration all the market and technology needs. With this objective, we have created a special section to engage the interested community through a blog, forums to discuss interesting issues, and a lot of information on benchmarking, including links to other benchmarks, pointers to interesting conferences and venues, and all the publications on benchmarking RDF and Graph technologies.</p>
+<p>We want to make sure that we all know what benchmarking and the LDBC effort mean, both historically and from the perspective of global needs. To make sure that this is accomplished, we set up a section open to the public with in-depth explanations of the history of industry benchmarking, of LDBC, and of why our society needs such efforts globally.</p>
+<p>Finally, we want to invite you to our Fifth Technical Users Community (TUC) meeting to be held in Athens next Monday, Oct. 6th 2014. The main objective of this event is to allow for presentations on experiences with the two already released benchmarks, SNB and SPB. You’ll find updated information here.</p>
+<p>In all, we expect that the LDBC organisation site engages all of you and that the future growth of RDF and Graph technologies is secured by the benchmarks we foster.</p> + + + + + 2nd International Workshop on Benchmarking RDF Systems + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + <p>Following the 1st International Workshop on Benchmarking RDF Systems (BeRSys 2013), the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industry practitioners can meet to discuss topics related to the performance of RDF systems. BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines - in the line of the TPCTC series of workshops. The focus of the workshop is to expose and initiate discussions on best practices, different application needs and scenarios related to different aspects of RDF data management.</p>
+<p>More at: <a href="http://events.sti2.at/bersys2014/">http://events.sti2.at/bersys2014/</a></p> + + + + + DATAGEN: Data Generation for the Social Network Benchmark + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + <p>As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective of providing a realistic yet challenging workload, consisting of a social network and a set of queries.
Both have to be realistic, easy to understand and easy to generate. The objective of this post is to discuss the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 <a href="#references">[1]</a>.</p>
+<p>One of the most important components of a benchmark is the dataset. However, directly using real data in a benchmark is not always possible. On the one hand, it is difficult to find data with all the scaling characteristics the benchmark requires. On the other hand, collecting real data can be expensive or simply not possible due to privacy concerns.</p>
+<p>For these reasons, LDBC-SNB provides DATAGEN, which is the synthetic data generator responsible for generating the datasets for the three LDBC-SNB workloads: the Interactive, the Business Intelligence and the Analytical. DATAGEN has been carefully designed with the following goals in mind:</p>
+<ul>
+<li><strong>Realism.</strong> The data generated by DATAGEN has to mimic the features of the data found in a real social network. In DATAGEN, output attributes, cardinalities, correlations and distributions have been finely tuned to reproduce a real social network in each of its aspects. DATAGEN is aware of the data and link distributions found in a real social network such as Facebook <a href="#references">[2]</a>. Also, it uses real data from DBpedia, such as property dictionaries, which ensure that the content is realistic and correlated (a toy sketch of such correlations follows after this list).</li>
+<li><strong>Scalability.</strong> Since LDBC-SNB is targeting systems of different scales and budgets, DATAGEN must be capable of generating datasets of different sizes, from a few gigabytes to terabytes. DATAGEN is implemented following the MapReduce paradigm, allowing for the generation of large datasets on commodity clusters.</li>
+<li><strong>Determinism.</strong> DATAGEN is deterministic regardless of the number of cores/machines used to produce the data. This important feature guarantees that all Test Sponsors will face the same dataset, thus making the comparisons between different systems fair and the benchmarks’ results reproducible.</li>
+<li><strong>Usability.</strong> LDBC-SNB has been designed to have an affordable entry point. As such, DATAGEN has been strongly influenced by this philosophy, and therefore it has been designed to be as easy to use as possible.</li>
+</ul>
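+<p>As a toy illustration of the realism ingredients named above (correlated attribute values and homophily-like connectivity), the following self-contained Java sketch draws a person&rsquo;s university from the person&rsquo;s own country with high probability and then makes friendship far more likely between people who share a university. The dictionaries, probabilities and seed are invented for the example; DATAGEN&rsquo;s real dictionaries, distributions and MapReduce-based edge generation are far more elaborate.</p>
+<pre tabindex="0"><code>import java.util.ArrayList;
+import java.util.List;
+import java.util.Random;
+
+public class CorrelationSketch {
+
+    static final String[] COUNTRIES = { "Germany", "Spain", "Netherlands" };
+    static final String[][] UNIVERSITIES = {
+        { "TUM", "HU Berlin" }, { "UPC", "UPM" }, { "VU Amsterdam", "TU Delft" }
+    };
+
+    static class Person {
+        final int id;
+        final String country;
+        final String university;
+        Person(int id, String country, String university) {
+            this.id = id; this.country = country; this.university = university;
+        }
+    }
+
+    public static void main(String[] args) {
+        Random rnd = new Random(42); // fixed seed: deterministic output, as a benchmark generator requires
+        List&lt;Person&gt; people = new ArrayList&lt;&gt;();
+        for (int i = 0; i &lt; 500; i++) {
+            int c = rnd.nextInt(COUNTRIES.length);
+            // Correlated attribute: with 90% probability the university is from the person's country.
+            String uni = rnd.nextDouble() &lt; 0.9
+                    ? UNIVERSITIES[c][rnd.nextInt(UNIVERSITIES[c].length)]
+                    : UNIVERSITIES[rnd.nextInt(UNIVERSITIES.length)][rnd.nextInt(2)];
+            people.add(new Person(i, COUNTRIES[c], uni));
+        }
+        // Homophily-like edges: sharing a university strongly boosts the friendship probability.
+        int sameUniEdges = 0, otherEdges = 0;
+        for (Person a : people) {
+            for (Person b : people) {
+                if (a.id &gt;= b.id) continue;
+                boolean sameUni = a.university.equals(b.university);
+                double p = sameUni ? 0.05 : 0.001;
+                if (rnd.nextDouble() &lt; p) {
+                    if (sameUni) sameUniEdges++; else otherEdges++;
+                }
+            }
+        }
+        System.out.println("edges within a university: " + sameUniEdges + ", other edges: " + otherEdges);
+    }
+}
+</code></pre>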
+<p>Finally, the use of DATAGEN is not limited to the scope of LDBC-SNB. Several researchers and practitioners are already using DATAGEN in a wide variety of situations. If you are interested in the internals and possibilities of DATAGEN, please visit its official repository (<a href="https://github.com/ldbc/ldbc_snb_datagen">https://github.com/ldbc/ldbc_snb_datagen</a>).</p>
+<h4 id="references">References</h4>
+<p>[1] Pham, Minh-Duc, Peter Boncz, and Orri Erling. &ldquo;S3G2: A scalable structure-correlated social graph generator.&rdquo; Selected Topics in Performance Evaluation and Benchmarking. Springer Berlin Heidelberg, 2013. 156-172.</p>
+<p>[2] Prat-Pérez, Arnau, and David Dominguez-Sal. &ldquo;How community-like is the structure of synthetically generated graphs?&rdquo; Proceedings of the Workshop on GRAph Data management Experiences and Systems. ACM, 2014.</p> + + + + + Getting Started With SNB + https://ldbcouncil.org/post/getting-started-with-snb/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-snb/ + <p>In a previous blog post titled &ldquo;<a href="https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/">Is SNB like Facebook&rsquo;s LinkBench?</a>&rdquo;, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.</p>
+<h3 id="datagen">DATAGEN</h3>
+<p>DATAGEN is the data generator used by all the workloads of SNB. <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/">Here</a> we introduced the design goals that drive the development of DATAGEN, which can be summarized as: <em>Realism, Scalability, Determinism and Usability.</em></p>
+<p>DATAGEN produces datasets with the following schema, in terms of entities and their relations. The generated data represents a snapshot, during a period of time, of the activity of a social network similar to real social networks such as Facebook. The data includes entities such as Persons, Organizations, and Places. The schema also models the way persons interact, by means of the friendship relations established with other persons, and the sharing of content such as messages (both textual and images), replies to messages and likes on messages. People form groups to talk about specific topics, which are represented as tags.</p>
+<p><img src="schema.png" alt="image"></p>
+<p>For the sake of credibility, data produced by DATAGEN has to be realistic. In this sense, data produced by DATAGEN not only has a realistic schema, but also pays attention to the following items:</p>
+<ul>
+<li>
+<p>Realistic distributions. The degree distribution of friendship relationships has been modeled to reproduce that found in the Facebook graph. Also, other distributions, such as the number of replies to a post, the number of persons per country or the popularity of a tag, have been realistically modeled, either using known distributions or data extracted from real sources such as DBpedia.</p>
+</li>
+<li>
+<p>Correlated attributes and relations. Attribute values are not chosen at random, but follow correlations. For instance, people from a specific country have a larger probability of having names typical of that country, of working at companies from that country, or of studying at universities of that country. Also, DATAGEN implements a relationship creation process that tries to reproduce the homophily principle, that is, people with similar characteristics tend to be connected.</p>
+</li>
+</ul>
+<p>DATAGEN is built on top of Hadoop to generate datasets of different sizes. It works either on single-node SMP machines or in a cluster environment. DATAGEN supports different output formats targeting different systems. On the one hand, we have the CSV format, where each entity and relation is output into a different comma-separated-value file. On the other hand, it also supports the Turtle format for RDF systems.</p>
+<p>Finally, DATAGEN outputs two other things:</p>
+<ul>
+<li>
+<p>Update Streams, which will be used in the future to implement updates in the workloads.</p>
+</li>
+<li>
+<p>Substitution parameters, which are the parameters of the query instances the LDBC driver will issue.
These are selected so that the query plans of the resulting query executions do not differ significantly.</p>
+</li>
+</ul>
+<p>Configuring and using DATAGEN is easy. Please visit <a href="https://github.com/ldbc/ldbc_snb_datagen">this page</a> for more information.</p>
+<h3 id="ldbc-driver">LDBC driver</h3>
+<p>SNB is designed to be as easy to adopt as possible. Therefore, SNB provides the LDBC execution driver, which is designed to automatically generate the benchmark workload and gather the benchmark results. It generates a stream of operations in conformance with a workload definition and executes those operations against some system, using the provided database connector and the substitution parameters produced by DATAGEN. During execution, the driver continuously measures performance metrics, and upon completion it generates a report of those metrics.</p>
+<p>It is capable of generating parallel workloads (e.g. concurrent reads and writes), while respecting the configured operation mix and ensuring that the ordering between dependent operations is maintained. For further details on how the driver achieves that, please visit the Documentation <a href="https://github.com/ldbc/ldbc_driver/wiki">page</a>.</p>
+<p>The test sponsor (i.e. the implementer of the benchmark) has to provide a set of implemented interfaces that form a benchmark implementation to plug into the driver; the benchmark is then executed automatically.</p>
+<p>Given a workload consisting of a series of <em>Operations</em>, the test sponsor implements <em>OperationHandlers</em> for them. <em>OperationHandlers</em> are responsible for executing instances of a specific operation (query) type. This is done by overriding the method <em>executeOperation</em>(), which receives an <em>Operation</em> instance as input parameter and returns the result. From the <em>Operation</em> instance, the operation&rsquo;s input parameters can be retrieved, as well as the database connection state.</p>
+<p>The database connector is used to initialize, clean up and get the database connection state. The database connector must implement the <em>Db</em> interface, which consists of three methods: <em>onInit</em>(), <em>onCleanup</em>() and <em>getConnectionState</em>(). <em>onInit</em>() is called before the benchmark is executed, and is responsible for initializing the database and registering the different <em>OperationHandlers</em>. <em>onCleanup</em>() is called after the benchmark has completed. Any resources that need to be released should be released here.</p>
+<p>Finally, <em>getConnectionState</em>() returns an instance of <em>DbConnectionState</em>, which encapsulates any state that needs to be shared between <em>OperationHandler</em> instances. For instance, this state could contain the necessary classes used to execute a given query for the implementing system.</p>
+<p>A good example of how to implement the benchmark can be found <a href="https://github.com/ldbc/ldbc_driver/wiki/Implementing%20a%20Database%20Connector">here</a>.</p>
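+<p>To make those moving parts concrete, here is a compact, self-contained Java sketch that mirrors the concepts just described: a connector with <em>onInit</em>(), <em>onCleanup</em>() and <em>getConnectionState</em>(), a shared connection state, and one operation handler. All class names and method signatures below are simplified stand-ins invented for illustration; the real interfaces live in the <code>ldbc_driver</code> project and differ in their exact shape, so follow the linked wiki page when writing an actual connector.</p>
+<pre tabindex="0"><code>import java.util.HashMap;
+import java.util.Map;
+
+public class ConnectorSketch {
+
+    // State shared between operation handlers, e.g. a connection pool or session factory.
+    static class MyConnectionState {
+        final String endpointUrl;
+        MyConnectionState(String endpointUrl) { this.endpointUrl = endpointUrl; }
+    }
+
+    // An operation instance carries the substitution parameters produced by DATAGEN.
+    static class FriendsWithNameOperation {
+        final long personId;
+        final String firstName;
+        FriendsWithNameOperation(long personId, String firstName) {
+            this.personId = personId; this.firstName = firstName;
+        }
+    }
+
+    // Handler for one operation type: runs it against the system under test and returns the result.
+    static class FriendsWithNameHandler {
+        String executeOperation(FriendsWithNameOperation op, MyConnectionState state) {
+            // A real connector would send a Cypher/SPARQL/SQL query to state.endpointUrl here.
+            return "friends of " + op.personId + " named " + op.firstName + " via " + state.endpointUrl;
+        }
+    }
+
+    // The connector itself: initialise, expose shared state, register handlers, clean up.
+    static class MyConnector {
+        private MyConnectionState state;
+        final Map&lt;String, Object&gt; handlers = new HashMap&lt;&gt;();
+
+        void onInit(Map&lt;String, String&gt; properties) {
+            state = new MyConnectionState(properties.getOrDefault("endpoint", "http://localhost:8890/sparql"));
+            handlers.put("FriendsWithName", new FriendsWithNameHandler()); // one handler per operation type
+        }
+        MyConnectionState getConnectionState() { return state; }
+        void onCleanup() { /* close sessions, release connections */ }
+    }
+
+    public static void main(String[] args) {
+        MyConnector db = new MyConnector();
+        db.onInit(new HashMap&lt;&gt;());
+        FriendsWithNameHandler handler = (FriendsWithNameHandler) db.handlers.get("FriendsWithName");
+        System.out.println(handler.executeOperation(
+                new FriendsWithNameOperation(1234L, "Ada"), db.getConnectionState()));
+        db.onCleanup();
+    }
+}
+</code></pre>
+<p>In the real driver, handler registration and result reporting go through the driver&rsquo;s own classes rather than the plain map and return value used here, and the driver, not your code, decides when each operation is executed.</p>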
+<h3 id="workloads">Workloads</h3>
+<p>Currently, LDBC has only released the first draft of the Interactive workload, but the business intelligence and analytical workloads are in the works. Workloads are designed to mimic the different usage scenarios found in operating a real social network site, and each of them targets one or more types of systems. Each workload defines a set of queries and query mixes, designed to stress the systems under test in different choke-point areas, while being credible and realistic.</p>
+<p>The Interactive workload reproduces the interaction between the users of the social network by including lookups and transactions that update small portions of the database. These queries are designed to be interactive and target systems capable of responding to such queries with low latency for multiple concurrent users. Examples of Interactive queries are retrieving, for a given user, those friends with a specific name, or finding the most recent posts and comments created by your friends.</p>
+<p>The Business Intelligence workload will represent those business intelligence analytics a social network company would like to perform on the social network, in order to take advantage of the data to discover new business opportunities. This workload will explore moderate portions of data from different entities, and will perform more complex and data-intensive operations compared to the Interactive ones.</p>
+<p>Examples of possible Business Intelligence queries could be finding the trending topics in a country at a given moment, or looking for fraudulent “likers”.</p>
+<p>Finally, the Analytical workload will aim at exploring the characteristics of the underlying structure of the network. Shortest paths, community detection or centrality are representative queries of this workload, and will imply touching a vast amount of the dataset.</p>
+<h3 id="final-remarks">Final remarks</h3>
+<p>This is just a quick overview of the SNB benchmark. For a more detailed description, do not hesitate to read the official SNB specification <a href="https://github.com/ldbc/ldbc_snb_docs">draft</a>, and stay tuned to the LDBC blog for future blog posts detailing all of the SNB parts in depth.</p> + + + + + Introducing SNB Interactive, the LDBC Social Network Benchmark Online Workload + https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/ + <p>The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads: interactive, business intelligence and graph analytics. This post introduces the interactive workload.</p>
+<p>The benchmark measures the speed of queries of medium complexity against a social network being constantly updated. The queries are scoped to a user&rsquo;s social environment and potentially access data associated with the friends of a user and their friends.</p>
+<p>This is representative of an operational application. This goes beyond OLTP (On Line Transaction Processing) by having substantially more complex queries touching much more data than the point lookups and short reports in TPC-C or TPC-E. The emphasis is on presenting a rich and timely view of a constantly changing environment.</p>
+<p>SNB Interactive gives end users and application developers a reference workload for comparing the relative merits of different technologies for graph data management. These range from dedicated graph databases to RDF stores and relational databases. There are graph serving benchmarks such as Facebook&rsquo;s LinkBench, but SNB Interactive goes well beyond this in richness of schema and queries.</p>
+<p>The challenge to implementors is handling the user-facing logic of a social network in a single system as the scale increases.
The present practice in large social networks is massive sharding and the use of different SQL and key-value stores for different aspects of the service. The SNB workload is not intended to replicate this situation but to look for ways forward, so that one system can keep up with transactions and offer users rich and varied insight into their environment. The present practice relies on massive precomputation, but SNB Interactive seeks more agility and ad hoc capability also on the operational side.</p>
+<p>The dataset is scaled in buckets, with distinct scales for 10, 30, 100, 300GB and so forth. A 100GB dataset has approximately 500,000 simulated users with their connections and online history. This is a convenient low-end single-server size, while 500 million users is 100TB, which is a data center scale requiring significant scale-out.</p>
+<p>The metric is operations per minute at scale. Online benchmarks typically have a fixed ratio between throughput and dataset size. Here we depart from this; thus one can report arbitrarily high throughputs at any scale. This makes main-memory approaches feasible, which corresponds to present online practices. The benchmark makes transactions and queries on a simulated timeline of social interactions. The challenge for the system is to run this as fast as possible at the selected scale while providing fast and predictable response times. Throughput can be increased at the cost of latency, but here the system must satisfy response time criteria while running at the reported throughput.</p>
+<p>Different technologies can be used for implementing SNB Interactive. The workload is defined in natural language with sample implementations in SPARQL and Cypher. Other possibilities include SQL and graph database APIs.</p>
+<p>SNB Interactive is an example of LDBC&rsquo;s choke-point-driven design methodology, where we draw on the combined knowledge and experience of several database system architects for defining realistic, yet ambitious challenges whose solution will advance the state of the art.</p>
+<p>The benchmark specification and associated tools are now offered for public feedback. The LDBC partners working on SNB Interactive will provide sample implementations of the workload on their systems, including Virtuoso, Neo4J and Sparsity. Specifics of availability and coverage may vary.</p>
+<p>Subsequent posts will address the workload in more detail.</p> + + + + + Is SNB Like Facebooks LinkBench + https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/ + <p>In this post, I will discuss in some detail the rationale and goals of the design of the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) and explain how it relates to real social network data as in Facebook, and in particular Facebook&rsquo;s own graph benchmark called <a href="https://www.facebook.com/notes/facebook-engineering/linkbench-a-database-benchmark-for-the-social-graph/10151391496443920">LinkBench</a>. We think SNB is the most intricate graph database benchmark to date (it&rsquo;s also available in RDF!), and it has already made some waves.
SNB recently received praise at the most important database systems conference, <a href="http://www.sigmod2014.org/">SIGMOD in Snowbird</a>, after being used for this year&rsquo;s <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD Programming Contest</a>, which was about graph analytics.</p> +<p>SNB is intended to provide the following <strong>value</strong> to different stakeholders:</p> +<ul> +<li> +<p>For end users facing graph processing tasks, SNB provides a recognizable scenario against which it is possible to <em>compare merits of different products</em> and technologies. By covering a wide variety of scales and price points, SNB can serve as an aid to technology selection.</p> +</li> +<li> +<p>For vendors of graph database technology, SNB provides a <em>checklist of features</em> and performance characteristics that helps in product positioning and can serve to guide new development.</p> +</li> +<li> +<p>For researchers, both industrial and academic, the SNB dataset and workload provide <em>interesting challenges</em> in multiple technical areas, such as query optimization, (distributed) graph analysis, transactional throughput, and provides a way to objectively compare the effectiveness and efficiency of new and existing technology in these areas.</p> +</li> +</ul> +<p>I should clarify that even though the data model of SNB resembles Facebook (and we&rsquo;re extending it to also look more like Twitter), the goal of SNB is not to advise Facebook or Twitter what systems to use; they don&rsquo;t need LDBC for that. Rather, we take social network data as a model for the much broader graph data management problems that IT practitioners face. The particular characteristic of a graph data management problem is that the queries and analysis are not just about finding data by value, but about learning about the <em>connection patterns</em> between data. The scenario of the SNB, a social network, was chosen with the following goals in mind:</p> +<ul> +<li> +<p>the benchmark scenario should be <strong>understandable</strong> to a large audience, and this audience should also understand the relevance of managing such data.</p> +</li> +<li> +<p>the scenario in the benchmark should cover the complete range of challenges <strong>relevant</strong> for graph data management, according to the benchmark scope.</p> +</li> +<li> +<p>the query challenges in it should be <strong>realistic</strong> in the sense that, though synthetic, similar data and workloads are encountered in practice.</p> +</li> +</ul> +<p>The SNB is in fact three distinct benchmarks with a common dataset, since there are <em>three different workloads</em>. Each workload produces a single metric for performance at the given scale and a price/performance metric at the scale. The full disclosure further breaks down the composition of the metric into its constituent parts, e.g. single query execution times.</p> +<ul> +<li> +<p><strong>Interactive Workload.</strong> The Interactive SNB workload is the first one we are releasing. It is defined in plain text, yet we have example implementations in Neo4j&rsquo;s Cypher, SPARQL and SQL. The Interactive workload tests a system&rsquo;s throughput with relatively simple queries with concurrent updates. The system under test (SUT) is expected to run in a steady state, providing durable storage with smooth response times. Inserts are typically small, affecting a few nodes at a time, e.g. uploading of a post and its tags. Transactions may require serializability, e.g.
verifying that something does not exist before committing the transaction. Reads do not typically require more than read committed isolation. One could call the Interactive Workload an OLTP workload, but while queries typically touch a small fraction of the database, this can still be up to hundreds of thousands of values (the two-step neighborhood of a person in the social graph, often). Note that in order to support the read queries, there is a lot of liberty to create indexing structures or materialized views; however, such structures need to be maintained with regard to the continuous inserts that are also part of the workload. This workload is now in draft stage, which means that the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a> and <a href="https://github.com/ldbc/ldbc_driver">driver software stack</a> are ready and the purpose is to obtain user feedback, as well as develop good system implementations. The first implementations of this workload are now running on Openlink Virtuoso, Neo4j and Sparsity Sparksee, and we are eager to see people try, optimize and evolve these.</p> +</li> +<li> +<p><strong>Business Intelligence Workload.</strong> There is a first stab at this workload formulated in SPARQL, tested against Openlink Virtuoso. The BI workload consists of complex structured queries for analyzing online behavior of users for marketing purposes. The workload stresses query execution and optimization. Queries typically touch a large fraction of the data and do not require repeatable read. The queries will be concurrent with trickle load (not out yet). Unlike the interactive workload, the queries touch more data as the database grows.</p> +</li> +<li> +<p><strong>Graph Analytics Workload.</strong> This workload is not yet available. It will test the functionality and scalability of the SUT for graph analytics that typically cannot be expressed in a query language. As such it is the natural domain for graph programming frameworks like Giraph. The workload is still under development, but will consist of algorithms like PageRank, Clustering and Breadth First Search. The analytics is done on most of the data in the graph as a single operation. The analysis itself produces large intermediate results. The analysis is not expected to be transactional or to have isolation from possible concurrent updates.</p> +</li> +</ul> +<p>All the SNB scenarios share a common scalable synthetic data set, generated by a state-of-the-art <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a>. We strongly believe in a single dataset that makes sense for all workloads, that is, the interactive and BI workloads will traverse data that has sensible PageRank outcomes, and graph clustering structure, etc. This is in contrast to <a href="http://people.cs.uchicago.edu/~tga/pubs/sigmod-linkbench-2013.pdf">LinkBench</a>, released by the team of Facebook that manages the OLTP workload on the Facebook Graph, which closely tunes to the <strong>low-level</strong> MySQL query patterns Facebook sees, but whose graph structure does not attempt to be realistic beyond the average out degree of the nodes (so, it makes no attempt to create realistic community patterns or correlations).
The authors of LinkBench may be right that the graph structure does not make a difference for simple insert/update/delete/lookup actions which LinkBench itself tests, but for the SNB queries in the Interactive and BI workloads this is not true. Note that <a href="http://borthakur.com/ftp/sigmod2013.pdf">Facebook&rsquo;s IT infrastructure</a> does not store all user data in MySQL and its modified memcached (&quot;<a href="http://www.cs.cmu.edu/~pavlo/courses/fall2013/static/papers/11730-atc13-bronson.pdf">TAO</a>&quot;), some of it ends up in separate subsystems (using HDFS and HBase), which is outside of the scope of LinkBench. However, for queries like in the SNB Interactive and BI workloads it <strong>does</strong> matter how people are connected, and how the attribute values of connected people correlate. In fact, the SNB data generator is unique in that it generates a huge graph with <em>correlations</em>, where people who live together, have the same interests or work for the same company have greater chance to be connected, and people from Germany have mostly German names, etc. Correlations frequently occur in practice and can strongly influence the quality of query optimization and execution, therefore LDBC wants to test their effects on graph data management systems (the impact of correlation among values and structure on query optimization and execution are a &ldquo;choke point&rdquo; for graph data management system where LDBC wants to stimulate innovation).</p> + + + + + Making It Interactive + https://ldbcouncil.org/post/making-it-interactive/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-it-interactive/ + <p><em>Synopsis:</em> Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must be both credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation for what online systems in fact do. So, the workload mix must strike a balance between the practice and presenting new challenges.</p> +<p>It is about to be showtime for LDBC. The initial installment of the LDBC Social Network Benchmark (SNB) is the full data generator, test driver, workload and reference implementation for the interactive workload. SNB will further acquire business intelligence and graph analytics workloads but this post is about the interactive workload.</p> +<p>As part of finalizing the interactive workload, we need to determine precise mixes of the component queries and updates. We note that the interactive mix so far consists of very heavy queries. These touch, depending on the scale upwards of a million entities in the database.</p> +<p>Now, rendering a page view in a social network site does not touch millions of entities. The query that needs to be correct and up to date touches tens or hundreds of entities, e.g. posts or social connections for a single page impression. 
There are also statistical views like the count of people within so many steps or contact recommendations but these are not real time and not recalculated each time they are shown.</p> +<p>So, LDBC SNB has a twofold task:</p> +<ol> +<li>In order to be a credible interactive workload, it must in fact have the characteristics of one.</li> +<li>In order to stimulate progress, it must have queries that are harder than those that go in routine page views but are still not database-wide analytics.</li> +</ol> +<p>Designing a workload presents specific challenges:</p> +<ol> +<li>The workload must be realistic enough for users to identify with it.</li> +<li>The workload must pose challenges and drive innovation in a useful direction.</li> +<li>The component operations must all play a noticeable role in it. If the operation&rsquo;s relative performance does not affect the score, why is it in the workload?</li> +</ol> +<p>The interactive mix now has 14 queries that are interesting from a query optimization and execution viewpoint but touch millions of entities. This is not what drives page impressions in online sites. Many uses of graph databases and RDF are in online sites, so this aspect must not be ignored.</p> +<p>Very roughly, the choke points (technical challenges) of SNB Interactive are as follows:</p> +<ul> +<li>Random access - Traversing between people and content makes for large numbers of random lookups. These can be variously parallelized and/or vectored.</li> +<li>Query optimization must produce the right plans - The primary point is join order and join type. Index vs. hash based joins have very different performance properties and the right choice depends on correctly guessing the number of rows and of distinct keys on either side of the join.</li> +<li>When doing updates and lookups, the execution plan is obvious but there the choke point is the scheduling of large numbers of short operations.</li> +<li>Many queries have aggregation, many have distinct, all have result ordering and a limit on result count. The diverse interactions of these operators produce optimization opportunities.</li> +</ul> +<p>Dreaming up a scenario and workload is not enough for a benchmark. There must also be a strong indication that the job is do-able and plausible in the scenario.</p> +<p>In online benchmarks different operations have different frequencies and the operations are repeated large numbers of times. There is a notion of steady state, so that the reported result represents a level of performance a system can sustain indefinitely.</p> +<p>A key part of the workload definition is the workload mix, i.e. the relative frequencies of the operations. This decides in fact what the benchmark measures.</p> +<p>The other aspect is the metric, typically some variation on operations per unit of time.</p> +<p>All these are interrelated. Here we can take clicks per second as a metric, which is easy to understand. We wish to avoid the pitfall of TPC-C which ties the metric to a data size, so that for a high metric one must have a correspondingly larger database. This rule makes memory-only implementations in practice unworkable, while in reality many online systems in fact run from memory. So, here we scale in buckets, like in TPC-H, but we still have an online workload. The scenario of the benchmark has its own timeline, here called simulation time. A benchmark run produces events in the simulation time but takes place in real time. This defines an acceleration ratio.
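+</p>
+<p>Before putting numbers on it, a small back-of-the-envelope sketch may help to show how simulation time, real time and the reported metric relate. The figures below are made up for illustration only and are not prescribed by the benchmark:</p>
+<pre><code class="language-python"># Illustrative figures only; none of these values are mandated by SNB.
+sim_seconds  = 7 * 3600      # simulation time covered by the run (7 hours)
+real_seconds = 1 * 3600      # wall-clock time the run actually took (1 hour)
+operations   = 3_600_000     # operations completed during the run
+
+acceleration   = sim_seconds / real_seconds    # 7.0, i.e. a 7x acceleration
+ops_per_second = operations / real_seconds     # 1000.0
+ops_per_minute = ops_per_second * 60           # the shape of the reported metric
+
+print(f"{acceleration:.0f}x acceleration, {ops_per_minute:,.0f} operations per minute")
+</code></pre>
+<p>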
For example we could say that a system does 1000 operations per second at 300G scale, with an acceleration of 7x, i.e. 7 hours worth of simulation time are done in one hour of real time. A metric of this form is directly understandable for sizing a system, as long as the workload mix is realistic. We note that online sites usually are provisioned so that servers do not run anywhere near their peak throughput at a busy time.</p> +<p>So how to define the actual mix? By measuring. But measuring requires a reference implementation that is generally up to date for the database science of the time and where the individual workload pieces are implemented in a reasonable manner, so no bad query plans or bad schema design. For the reference implementation, we use Virtuoso column store in SQL.</p> +<p>But SQL is not graphy! Why not SPARQL? Because SPARQL has diverse fixed overheads and this is not a RDF-only workload. We do not want SPARQL overheads to bias the metric, we just want an implementation where we know exactly what goes on and how it works, with control of physical data placement so we know there are no obvious stupidities in any of this. SPARQL will come. Anyway, as said elsewhere, we believe that SPARQL will outgrow its overheads, at which point SQL or SPARQL is a matter of esthetic preference. For now, it is SQL and all we want is transparency into the metal.</p> +<p>Having this, we peg the operation mix to the update stream generated by the data generator. At the 30G scale, there are 3.5M new posts/replies per month of simulation time. For each such, a query mix will be run, so as to establish a realistic read/write ratio. The query mix will have fractional queries, for example 0.2 friends recommendations per new post, but that is not a problem, since we run large numbers of these and at the end of the run can check that the ratios of counts are as expected. Next, we run this as fast as it will go on the test system. Then we adjust the ratio of short and long queries to get two objectives:</p> +<ul> +<li>Short queries should collectively be about 45% of the CPU load.</li> +<li>Updates will be under 5%</li> +<li>Long queries will take up the rest. For long queries, we further tune the relative frequencies so that each represents a roughly equal slice of the time. Having a query that does not influence the metric is useless, so each gets enough showtime to have an impact but by their nature some are longer than others.</li> +</ul> +<p>The reason why short queries should have a large slice is the fact that this is so in real interactive systems. The reason why long queries are important is driving innovation. Like this we get both scheduling (short lookup/update) and optimization choke points covered. As a bonus be make the mix so that we get a high metric, so many clicks per second, since this is what the operator of an online site wants.</p> +<p>There is a further catch: Different scales have different degrees of the friends graph and this will have a different influence on different queries. To see whether this twists the metric out of shape we must experiment. For example, one must not have ogarithmic and linear complexity queries in the same mix, as BSBM for example has. 
So this is to be kept in mind as we proceed.</p> +<p>In the next post we will look at the actual mix and execution times on the test system.</p> + + + + + SNB Data Generator - Getting Started + https://ldbcouncil.org/post/snb-data-generator-getting-started/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-data-generator-getting-started/ + <p>In previous posts (<a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">this</a> and <a href="https://ldbcouncil.org/post/getting-started-with-snb">this</a>) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datasets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.</p> +<h3 id="getting-and-configuring-hadoop">Getting and Configuring Hadoop</h3> +<p>DATAGEN runs on top of hadoop 1.2.1 in order to scale. You can download it from here. Open a console and type the following commands to decompress hadoop into the /home/user folder:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user +</span></span><span style="display:flex;"><span>$ tar xvfz hadoop-1.2.1.tar.gz +</span></span></code></pre></div><p>For simplicity, in this tutorial we will run DATAGEN in standalone mode, that is, only one machine will be used, using only one thread at a time to run the mappers and reducers. This is the default configuration, and therefore nothing else needs to be done to configure it. For other configurations, such as Pseudo-Distributed (multiple threads on a single node) or Distributed (a cluster machine), visit the <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/wiki/Configuration">LDBC DATAGEN wiki</a>.</p> +<h3 id="getting-and-configuring-datagen">Getting and configuring DATAGEN</h3> +<p>Before downloading DATAGEN, be sure to fulfill the following requirements:</p> +<ul> +<li>Linux based machine</li> +<li>java 1.6 or greater</li> +<li>python 2.7.X</li> +<li>maven 3</li> +</ul> +<p>After configuring hadoop, now is the time to get DATAGEN from the LDBC-SNB official repositories. Always download the latest release, which at this time is v0.1.2. The releases page can be found <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/releases">here</a>. Again, decompress the downloaded file with the following commands:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user +</span></span><span style="display:flex;"><span>$ tar xvfz ldbc_snb_datagen-0.1.2.tar.gz +</span></span></code></pre></div><p>This will create a folder called “ldbc_snb_datagen-0.1.2”.</p> +<p>DATAGEN provides <em>run.sh</em>, a script to automate the compilation and execution of DATAGEN.
It needs to be configured for your environment, so open it and set the two variables at the top of the script to the corresponding paths.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>HADOOP_HOME<span style="color:#f92672">=</span>/home/user/hadoop-1.2.1 +</span></span><span style="display:flex;"><span>LDBC_SNB_DATAGEN_HOME<span style="color:#f92672">=</span>/home/user/ldbc_snb_datagen +</span></span></code></pre></div><p>HADOOP_HOME points to the path where hadoop-1.2.1 is installed, while LDBC_SNB_DATAGEN_HOME points to where DATAGEN is installed. Change these variables to the appropriate values. Now, we can execute <em>run.sh</em> script to compile and execute DATAGEN using default parameters. Type the following commands:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user/ldbc_snb_datagen-0.1.2 +</span></span><span style="display:flex;"><span>$ ./run.sh +</span></span></code></pre></div><p>This will run DATAGEN, and two folders will be created at the same directory: <em>social_network</em> containing the scale factor 1 dataset with csv uncompressed files, and <em>substitution_parameters</em> containing the substituion parameters needed by the driver to execute the benchmark.</p> +<h3 id="changing-the-generated-dataset">Changing the generated dataset</h3> +<p>The characteristics of the dataset to be generated are specified in the <em>params.ini</em> file. By default, this file has the following content:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:1</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:1</span> +</span></span></code></pre></div><p>The following is the list of options and their default values supported by DATAGEN:</p> +<table> +<thead> +<tr> +<th>Option</th> +<th>Default value</th> +<th>Description</th> +</tr> +</thead> +<tbody> +<tr> +<td>scaleFactor</td> +<td>1</td> +<td>&ldquo;The scale factor of the data to generate. Possible values are: 1, 3, 10, 30, 100, 300 and 1000&rdquo;</td> +</tr> +<tr> +<td>serializer</td> +<td>csv</td> +<td>&ldquo;The format of the output data. Options are: csv, csv_merge_foreign, ttl&rdquo;</td> +</tr> +<tr> +<td>compressed</td> +<td>FALSE</td> +<td>Specifies to compress the output data in gzip.</td> +</tr> +<tr> +<td>outputDir</td> +<td>./</td> +<td>Specifies the folder to output the data.</td> +</tr> +<tr> +<td>updateStreams</td> +<td>FALSE</td> +<td>&ldquo;Specifies to generate the update streams of the network. If set to false, then the update portion of the network is output as static&rdquo;</td> +</tr> +<tr> +<td>numThreads</td> +<td>1</td> +<td>Sets the number of threads to use. 
Only works for pseudo-distributed mode</td> +</tr> +</tbody> +</table> +<p>For instance, a possible <em>params.ini</em> file could be the following:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:30</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:ttl</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:true</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span> +</span></span></code></pre></div><p>For those not interested on generating a dataset for a given predefined scale factor, but for other applications, the following parameters can be specified (they need to be specified all together):</p> +<table> +<thead> +<tr> +<th>Option</th> +<th>Default value</th> +<th>Description</th> +</tr> +</thead> +<tbody> +<tr> +<td>numPersons</td> +<td>-</td> +<td>The number of persons to generate</td> +</tr> +<tr> +<td>numYears</td> +<td>-</td> +<td>The amount of years of activity</td> +</tr> +<tr> +<td>startYear</td> +<td>-</td> +<td>The start year of simulation.</td> +</tr> +</tbody> +</table> +<p>The following is an example of another possible <em>params.ini</em> file</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">numPersons:100000</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numYears:3</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">startYear:2010</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv_merge_foreign</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:true</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span> +</span></span></code></pre></div><p>For more information about the schema of the generated data, the different scale factors and serializers, please visit the wiki page of DATAGEN at <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/">GitHub</a>!</p> + + + + + The Day of Graph Analytics + https://ldbcouncil.org/post/the-day-of-graph-analytics/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/the-day-of-graph-analytics/ + <p><em>Note: consider this post as a continuation of the &ldquo;<a href="https://ldbcouncil.org/post/making-it-interactive">Making it interactive</a>&rdquo; post by Orri Erling.</em></p> +<p>I have now completed the <a href="https://github.com/openlink/virtuoso-opensource">Virtuoso</a> TPC-H work, including scale out. Optimization possibilities extend to infinity but the present level is good enough. 
<a href="http://www.tpc.org/tpch/">TPC-H</a> is the classic of all analytics benchmarks and is difficult enough, I have extensive commentary on this on my blog (In Hoc Signo Vinces series), including experimental results. This is, as it were, the cornerstone of the true science. This is however not the totality of it. From the LDBC angle, we might liken this to the last camp before attempting a mountain peak.</p> +<p>So, we may now seriously turn to graph analytics. The project has enough left to run in order to get a good BI and graph analytics workload. In LDBC in general, as in the following, BI or business intelligence means complex analytical queries. Graph analytics means graph algorithms that are typically done in graph programming frameworks or libraries.</p> +<p>The BI part is like TPC-H, except for adding the following challenges:</p> +<ul> +<li> +<p>Joins of derived tables with group by, e.g. comparing popularity of items on consecutive time periods.</p> +</li> +<li> +<p>Transitive dimensions - A geographical or tag hierarchy can be seen as a dimension table. To get the star schema plan with the selective hash join, the count of the transitive traversal of the hierarchy (hash build side) must be correctly guessed.</p> +</li> +<li> +<p>Transitivity in fact table, i.e. average length of reply thread. There the cost model must figure that the reply link is much too high cardinality for hash build side, besides a transitive operation is not a good candidate for a build in multiple passes, hence the plan will have to be by index.</p> +</li> +<li> +<p>Graph traversal with condition on end point and navigation step. The hierarchical dimensions and reply threads are in fact trees, the social graph is not. Again the system must know some properties of connectedness (in/out degree, count of vertices) to guess a traversal fanout. This dictates the join type in the step (hash or index). An example is a transitive closure with steps satisfying a condition, e.g. all connected persons have a specific clearance.</p> +</li> +<li> +<p>Running one query with parameters from different buckets, implying different best plan.</p> +</li> +<li> +<p>Data correlations, e.g. high selectivity arising from two interests seldom occurring together, in places where the correct estimation makes the difference between a good and a bad plan.</p> +</li> +<li> +<p>Large intermediate results stored in tables, as in materializing complex summaries of data for use in follow up queries.</p> +</li> +<li> +<p>More unions and outer joins.</p> +</li> +</ul> +<p>The idea is to cover the base competences the world has come to expect and to build in challenges to last another 10-15 years.</p> +<p>For rules and metric, we can use the TPC-H or <a href="http://www.tpc.org/tpcds/default.asp">TPC-DS</a> ones as a template. The schema may differ from an implementation of the interactive workload, as these things would normally run on different systems anyway. As another activity that is not directly LDBC, I will do a merge of SNB and <a href="http://www.openstreetmap.org/">Open Street Map</a>. The geolocated things (persons, posts) will get real coordinates from their vicinity and diverse geo analytics will become possible. This is of some significant interest to Geoknow, another FP7 where OpenLink is participating.</p> +<p>Doing the BI mix and even optimizing the interactive part involves some redoing of the present support for transitivity in Virtuoso. 
For that job, the partitioned group by with some custom aggregates is the right tool, with all parallelization, scale-out, etc. ready. You see, TPC-H is very useful also in places one does not immediately associate with it.</p> +<p>As a matter of fact, this becomes a BSP (bulk synchronous processing) control structure. Run any number of steps; in each step, every item produces results/effects scattered across partitions. The output of the previous is the input of the next. We might say BSP is an attractor or &ldquo;Platonic&rdquo; control structure to which certain paths inevitably lead. Last year I did a BSP implementation in SQL, reading and writing tables and using transactions for serializable update of the border. This is possible, but it will not compete with a memory based framework, and not enough of the optimization potential, e.g. message combining, is visible to the engine in this formulation. So, now we will get this right, as suggested.</p> +<p>So, the transitive derived table construct can have pluggable aggregations (e.g. remembering a path, a minimum length or such), reduction like a scalar-valued aggregate (min/max), different grouping sets like in a group by with cube or grouping sets, some group-by like reduction for message combining and so forth. If there is a gather phase that is not just the result of the scatter of the previous step, this can be expressed as an arbitrary database query, also cross partition in a scale-out setting.</p> +<p>The distributed/partitioned group by hash table will be a first class citizen, like a procedure scoped temporary table, to facilitate returning multiple results and passing large data between multiple steps with different vertex operations, e.g. forward and backward in betweenness centrality.</p> +<p>This brings us to the graph analytics proper, which is often done in BSP style, e.g. <a href="http://es.slideshare.net/shatteredNirvana/pregel-a-system-for-largescale-graph-processing">Pregel</a>, <a href="http://giraph.apache.org">Giraph</a>, <a href="http://uzh.github.io/signal-collect/">Signal-Collect</a>, and some but not all <a href="http://ppl.stanford.edu/main/green_marl.html">Green-Marl</a> applications. In fact, a Green-Marl back end for Virtuoso is conceivable; whether one will be made is a different matter.</p> +<p>With BSP in the database engine, a reference implementation of many standard algorithms is readily feasible and performant enough to do reasonable sizing for the workload and to have a metric. This could be edges or vertices per unit of time, across a mix of algorithms, for example. Some experimentation will be needed. The algorithms themselves may be had from the Green-Marl sample programs or other implementations. Among others, Oracle would presumably agree that this sort of functionality will in time migrate into the core database. We will here have a go at this and along the way formulate some benchmark tasks for a graph analytics workload. Whenever feasible, this will derive from existing work such as <a href="http://graphbench.org/">graphbench.org</a> but will be adapted to the SNB dataset.</p> +<p>The analytics part will be done with more community outreach than the interactive one. I will blog about the business questions, queries and choke points as we go through them.
The interested may pitch in as the matter comes up.</p> + + + + + Using LDBC SPB to Find OWLIM Performance Issues + https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/ + Wed, 20 Aug 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/ + <p>During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (LDBC-SPB) as a part of our development and release process.</p> +<p>The first thing we’ve started using the LDBC-SPB for is to monitor the performance of our RDF Store when a new release is about to come out.</p> +<p>Initially we’ve decided to fix some of the benchmark parameters:</p> +<ul> +<li>the dataset size - 50 million triples (LDBC-SPB50)</li> +<li>benchmark warmup and benchmark run times - 60s and 600s respectively</li> +<li>maximum number of Editorial Agents (E): 2 (threads that will execute INSERT/UPDATE operations)</li> +<li>maximum number of Aggregation Agents (A): 16 (threads that will execute SELECT operations)</li> +<li>data generated by the benchmark driver to be “freshly” deployed before each benchmark run - the benchmark driver can be configured to generate the data and stop; we’re using that option and have a fresh copy of it put aside ready for each run</li> +</ul> +<p>Having those parameters fixed, running LDBC-SPB is a straightforward task. The hardware we’re using for benchmarking is a machine with 2 Intel Xeon CPUs, 8 cores each, 256 GB of memory and SSD storage, running Linux. Another piece of hardware we’ve tested with is a regular desktop machine with an Intel i7, 32 GB of memory and HDD storage. During our experiments we have allowed a deviation in results of 5% to 10% because of the multi-threaded nature of the benchmark driver.</p> +<p>We’ve also decided to produce some benchmark results on Amazon’s EC2 instances and compare them with the results we’ve had so far. Starting with an m3.2xlarge instance (8 vCPUs, 30GB of memory and 2x80GB SSD storage) on a 50M dataset, we’ve achieved more than 50% lower results than the ones on our own hardware. On a larger Amazon instance, c3.4xlarge (16 vCPUs, 30GB of memory and doubled SSD storage), we’ve achieved the same performance in terms of aggregation operations and even worse performance in terms of editorial operations, which we attribute to the fact that Amazon instances are not providing consistent performance all the time.</p> +<p>The following two charts show how OWLIM performs on different hardware and with different configurations. They also give an indication of Amazon’s capabilities compared to the results achieved on bare-metal hardware.</p> +<p><img src="16-2-Performance.png" alt="image"></p> +<p>Figure 1: OWLIM performance: 2 Amazon instances and 2 local machines. 16 aggregation and 2 editorial agents running simultaneously. Aggregation and editorial operations displayed here should be considered independently, i.e. even though the editorial operations graph shows higher results on the Amazon m3.2xlarge instance, values are normalized and refer to the corresponding type of operation.</p> +<p><img src="8-0-Performance.png" alt="image"></p> +<p>Figure 2: OWLIM performance: 2 Amazon instances and 2 local machines. 8 aggregation agents running simultaneously. Read-only mode.</p> +<p>Another thing that we’re using LDBC-SPB for is to monitor load performance speeds.
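+</p>
+<p>For reference, manually pushing a chunk of the generated data amounts to a plain HTTP POST of an RDF file to the store. A minimal Python sketch of that step is shown below; the endpoint URL and file name are placeholders for illustration and are not prescribed by LDBC-SPB:</p>
+<pre><code class="language-python">import urllib.request
+
+# Placeholders: point these at your own repository and generated data chunk.
+endpoint = "http://localhost:8080/repositories/ldbc-spb/statements"
+datafile = "generatedCreativeWorks-0.ttl"
+
+with open(datafile, "rb") as f:
+    req = urllib.request.Request(
+        endpoint,
+        data=f.read(),
+        headers={"Content-Type": "text/turtle"},
+        method="POST",
+    )
+with urllib.request.urlopen(req) as resp:
+    print(resp.status, resp.reason)
+</code></pre>
+<p>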
Loading of the generated data can be done either manually, by creating some sort of script along those lines (e.g. with CURL), or by the benchmark driver itself, which will execute a standard POST request against a provided SPARQL endpoint. The benchmark&rsquo;s data generator can be configured to produce chunks of generated data in various sizes, which can be used for experiments on load performance. Of course, load times of forward-chaining reasoners cannot be compared to backward-chaining ones, but that is not the goal of the benchmark. Load performance is not measured “officially” by LDBC-SPB (although the time for loading the data is reported), but it is a good thing to have when comparing RDF stores.</p> +<p>An additional and interesting feature of the SPB is the test for conformance to the OWL2-RL rule-set. It is a part of the LDBC-SPB benchmark and that phase is called <em>checkConformance</em>. The phase is run independently of the benchmark phase itself. It requires no data generation or loading except the initial set of ontologies. It tests an RDF store’s capabilities for conformance to the rules in the OWL2-RL rule-set by executing a number of INSERT/ASK queries specific to each rule. The result of that phase is a list of all rules that have passed or failed, which is very useful for regression testing.</p> + + + + + Fourth TUC meeting + https://ldbcouncil.org/event/fourth-tuc-meeting/ + Thu, 03 Apr 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fourth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the fourth Technical User Community (TUC) meeting.</p> +<p>This will be a one-day event at CWI in Amsterdam on <em>Thursday April 3, 2014</em>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend.
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<p><strong>For presenters please limit your talks to just 15 minutes</strong></p> +<h3 id="agenda">Agenda</h3> +<p><strong>April 3rd</strong></p> +<ul> +<li> +<p>10:00 Peter Boncz (VUA) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506371.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=JYWVgrP1kVY">video</a>: <em>LDBC project status update</em></p> +</li> +<li> +<p>10:20 Norbert Martinez (UPC) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506375.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=4yREJQ3yDr0">video</a>: <em>Status update on the LDBC Social Network Benchmark (SNB) task force</em>.</p> +</li> +<li> +<p>10:50 Alexandru Iosup (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506363.ppt">ppt</a>, <a href="https://www.youtube.com/watch?v=ulT-RFwKpOE">video</a>: <em>Towards Benchmarking Graph-Processing Platforms</em></p> +</li> +<li> +<p>11:10 Mike Bryant (Kings College) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506364.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=KiHRTu9xx0A">video</a>: <em>EHRI Project: Archival Integration with Neo4j</em></p> +</li> +</ul> +<p><strong>11:30 coffee</strong></p> +<ul> +<li> +<p>11:50 Thilo Muth (University of Magdeburg) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506369.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=5xH3UDLP6Oc">video</a>: <em>MetaProteomeAnalyzer: a graph database backed software for functional and taxonomic protein data analysis</em></p> +</li> +<li> +<p>12:10 Davy Suvee (Janssen Pharmaceutica / Johnson &amp; Johnson) – <a href="https://www.youtube.com/watch?v=XN3LRJUfJIU">video</a>: <em>Euretos Brain - Experiences on using a graph database to analyse data stored as a scientific knowledge graph</em></p> +</li> +<li> +<p>12:30 Yongming Luo (TU Eindhoven) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506366.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=g_my3tBB2_s">video</a>: <em>Regularities and dynamics in bisimulation reductions of big graphs</em></p> +</li> +<li> +<p>12:50 Christopher Davis (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506370.pdf">pdf</a>, <a href="https://www.youtube.com/channel/UC6HbzfJ4016Vez-2HKNeDag">video</a>: <em>Enipedia - Enipedia is an active exploration into the applications of wikis and the semantic web for energy and industry issues</em></p> +</li> +</ul> +<p><strong>13:10 - 14:30 lunch @ restaurant Polder</strong></p> +<ul> +<li> +<p>14:30 <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506365.pptx">SPB task force report</a></p> +</li> +<li> +<p>15:00 Bastiaan Bijl (Sysunite) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506373.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=TsCeKDHShMY">video</a>: <em>Using a semantic approach for monitoring applications in large engineering projects</em></p> +</li> +<li> +<p>15:20 Frans Knibbe (Geodan) – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506372.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=uAX-m4OewPM">video</a>: <em>Benchmarks for geographical data</em></p> +</li> +<li> +<p>15:40 Armando Stellato (University of Rome, Tor Vergata &amp; UN Food and Agriculture Organization) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506374.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=mfA4csAs72Y">video</a>: <em>VocBench2.0, a Collaborative Environment for SKOS/SKOS-XL Management: scalability and (inter)operatibility challenges</em></p> +</li> +</ul> +<p><strong>16:00 coffee</strong></p> +<ul> +<li> +<p>16:20 Ralph Hodgson (TopQuadrant) – [pdf](https://pu b-3834 10a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachment s/5538064/5506367.pdf), <a href="https://www.youtube.com/watch?v=ZUDnVw9P_Rc">video</a>:<em>Customer experiences in implementing SKOS-based vocabularymanagement systems</em></p> +</li> +<li> +<p>16:40 Simon Jupp (European Bioinformatics Institute) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506368.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=CgTuOGK92W8">video</a>: <em>[Delivering RDF for the life science at the European Bioinformatics Institute: Six months in.]</em></p> +</li> +<li> +<p>17:00 Jerven Bolleman (Swiss Institute of Bioinformatics) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506381.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=QTc3yOgoEsg">video</a>: <em>Breakmarking UniProt RDF. SPARQL queries that make your database cry&hellip;</em></p> +</li> +<li> +<p>17:20 Rein van &rsquo;t Veer (Digital Heritage Netherlands) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506380.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=2vDrZoskGyQ">video</a> <em>Time and space for heritage</em></p> +</li> +<li> +<p>17:40 <strong>end of meeting</strong></p> +</li> +<li> +<p>19:00 - 21:30 Social Dinner in restaurant Boom</p> +</li> +</ul> +<p><strong>April 4th</strong></p> +<p>LDBC plenary meeting for project partners.</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506362.ppt">Benchmarking Graph-Processing Platforms: A Vision</a> – Alexandru Iosup</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p>The meeting will be held at the Dutch national research institute for computer science and mathematics (<a href="http://www.cwi.nl">CWI</a> - Centrum voor Wiskunde en Informatica). 
It is located at <a href="http://www.amsterdamsciencepark.nl/">Amsterdam Science Park</a>:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505821.jpg" alt=""></p> +<p>(<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505820.pdf">A5 map</a>)</p> +<h6 id="travel">Travel</h6> +<p><strong>Arriving &amp; departing:</strong></p> +<p>Amsterdam has a well-functioning and nearby airport called Schiphol (AMS, <a href="http://www.schiphol.com/">www.schiphol.nl</a>) that serves all main European carriers and also very many low-fare carriers.</p> +<p><a href="http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane">http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane</a></p> +<p><strong>Trains</strong> (~5 per hour) are the most convenient means of transport between Schiphol airport and Amsterdam city center, the Centraal Station (17 minutes, a train every 15 minutes) &ndash; which station you are also likely arriving at in case of an international train trip.</p> +<p>From the Centraal Station in Amsterdam, there is a direct train (every half an hour, runs 11 minutes) to the Science Park station, which is walking distance of CWI. If you go from the Centraal Station to one of the hotels, you should take tram 9 &ndash; it starts at Centraal Station (exception: for Hotel Casa 400, you should take the metro to Amstel station - any of the metros will do).</p> +<p><strong>Taxi</strong> is an alternative, though expensive. The price from Schiphol will be around 45 EUR to the CWI or another point in the city center (depending on traffic, the ride is 20-30 minutes).</p> +<p><strong>Public transportation</strong> (tram, bus, metro) tickets for a single ride and 1-day (24 hour) passes can be purchased from the driver/conductor on trams and buses (cash only) and from vending machines in the metro stations.</p> +<p><strong>Only the &ldquo;disposable&rdquo; cards are interesting for you as visitor.</strong></p> +<p>Multi-day (up to 7-days/168 hours) passes can only be purchased from the vending machines or from the ticket office opposite of Centraal Station.</p> +<p><strong>Getting Around:</strong> the fastest way to move in the city of Amsterdam generally is by bicycle. Consider renting such a device at your hotel. For getting from your hotel to the CWI, you can either take a taxi (expensive), have a long walk (35min), use public transportation (for NH Tropen/The Manor take bus 40 from Muiderpoort Station, for Hotel Casa 400 same bus 40 but from Amstel station, and for the Rembrandt Hotel it is tram 9 until Middenweg/Kruislaan and then bus 40), or indeed bike for 12 minutes.</p> +<p><strong>Cars</strong></p> +<p>In case you plan to arrive by car, please be aware that parking space in Amsterdam is scarce and hence very expensive. But, you can park your car on the &ldquo;WCW&rdquo; terrain where CWI is located. To enter the terrain by car, you have to get a ticket from the machine at the gate. To leave the terrain, again, you can get an exit ticket from the CWI reception.</p> +<p><strong>Arriving at CWI:</strong> Once you arrive at CWI, you need to meet the reception, and tell them that you are attending the LDBC TUC meeting. 
Then, you&rsquo;ll receive a visitor&rsquo;s pass that allows you to enter our building.</p> +<p><strong>Social Dinner</strong></p> +<p>The social dinner will take place at 7pm on April 3 in Restaurant Boom (<a href="http://www.boometenendrinken.nl/">boometenendrinken.nl</a>), Linneausstraat 63, Amsterdam.</p> + + + + + Third TUC Meeting + https://ldbcouncil.org/event/third-tuc-meeting/ + Tue, 19 Nov 2013 08:00:00 +0000 + + https://ldbcouncil.org/event/third-tuc-meeting/ + <p>The LDBC consortium is pleased to announce the third Technical User Community (TUC) meeting!</p> +<p>This will be a one day event in London on the <strong>19 November 2013</strong> running in collaboration with the <a href="http://www.graphconnect.com/london/">GraphConnect</a> event (18/19 November). Registered TUC participants that would like a free pass to all of GraphConnect should register for GraphConnect using this following coupon code: <strong>LDBCTUC</strong>.</p> +<p>The TUC event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology</li> +<li>Industry discussions on the contents of the benchmarks</li> +</ul> +<p>We will also be launching the LDBC non-profit organization, so anyone outside the EU project will be able to join as a member.</p> +<p>We will kick off new benchmark development task forces in the coming year, and talks at this coming TUC will play an important role in deciding the use case scenarios that will drive those benchmarks.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a></li> +<li><a href="#ldbctuc-background">LDBC/TUC Background</a> +<ul> +<li><a href="#social-network-benchmark">Social Network Benchmark</a></li> +<li><a href="#semantic-publishing-benchmark">Semantic Publishing Benchmark</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>November 19th - Public TUC Meeting</strong></p> +<p>8:00 Breakfast and registration will open for Graph Connect/TUC at 8:00 am (Dexter House)</p> +<p>short LDBC presentation (Peter Boncz) during GraphConnect keynote by Emil Eifrem (09:00-09:30 Dexter House)</p> +<p>NOTE: the TUC meeting is at the Tower Hotel, nearby Dexter House.</p> +<p>10:00 TUC Meeting Opening (Peter Boncz)</p> +<p>10:10 TUC Presentations (RDF Application Descriptions)</p> +<ul> +<li>Johan Hjerling (BBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275669.pdf">BBC Linked Data and the Semantic Publishing Benchmark</a></strong></em></li> +<li>Andreas Both (Unister): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505027.pdf">Ontology-driven applications in an e-commerce context</a></strong></em></li> +<li>Nuno Carvalho (Fujitsu Laboratories Europe): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275666.pdf"><em><strong>Fujitsu RDF use cases and benchmarking requirements</strong></em></a></li> +<li>Robina Clayphan (Europeana): <em><strong><a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816977.ppt">Europeana and Open Data</a></strong></em></li> +</ul> +<p>11:30 Semantic Publishing Benchmark (SPB)</p> +<ul> +<li>Venelin Kotsev (Ontotext - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">Semantic Publishing Benchmark Task Force Update</a></strong></em> and <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">report</a></strong></em></li> +</ul> +<p>12:00-13:00 Lunch at the Graph Connect venue</p> +<p><em>Talks During Lunch:</em></p> +<ul> +<li>Pedro Furtado, Jorge Bernardino (Univ. Coimbra): <strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275671.pdf">KEYSTONE Cost Action</a></strong></li> +</ul> +<p>13:00 TUC Presentations (Graph Application Descriptions)</p> +<ul> +<li>Minqi Zhou / Weining Qian (East China Normal University): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275670.pdf">Elastic and realistic social media data generation</a></strong></em></li> +<li>Andrew Sherlock (Shapespace): <em><strong>Shapespace Use Case</strong></em></li> +<li>Sebastian Verheughe (Telenor): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275667.pdf">Real-time Resource Authorization</a></strong></em></li> +</ul> +<p>14:00 Social Network Benchmark (SNB)</p> +<ul> +<li>Norbert Martinez (UPC - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505025.pdf">Social Network Benchmark Task Force Update</a></strong></em> and <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816975.pdf">Report</a></li> +</ul> +<p><em>14:30 Break</em></p> +<p>14:45 TUC Presentations (Graph Analytics)</p> +<ul> +<li>Keith Houck (IBM): <em><strong>Benchmarking experiences with [System G Native Store (tentative title)]</strong></em></li> +<li>Abraham Bernstein (University of Zurich): <em><strong>Streams and Advanced Processing: Benchmarking RDF querying beyond the Standard SPARQL Triple Store</strong></em></li> +<li>Luis Ceze (University of Washington): <em><strong>Grappa and GraphBench Status Update</strong></em></li> +</ul> +<p><em>15:45 Break</em></p> +<p>16:00 TUC Presentations* (Possible Future RDF Benchmarking Topics)*</p> +<ul> +<li>Christian-Emil Ore (Unit for Digital Documentation, University of Oslo, Norway): <em><strong>CIDOC-CRM</strong></em></li> +<li>Atanas Kiryakov (Ontotext): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275672.pdf">Large-scale Reasoning with a Complex Cultural Heritage Ontology (CIDOC CRM)</a></strong></em></li> +<li>Kostis Kyzirakos (National and Kapodistrian University of Athens / CWI): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275668.pdf">Geographica: A Benchmark for Geospatial RDF Stores</a></strong></em></li> +<li>Xavier Lopez (Oracle): <em><strong>W3C Property Graph progress</strong></em></li> +<li>Thomas Scharrenbach (University Zurich) <em><strong>PCKS: Benchmarking Semantic Flow Processing Systems</strong></em></li> +</ul> +<p>17:20 
Meeting Conclusion (Josep Larriba Pey)</p> +<p>17:30 End of TUC meeting</p> +<p>19:00 Social dinner</p> +<p><strong>November 20th - Internal LDBC Meeting</strong></p> +<p>10:00 Start</p> +<p>12:30 <em>End of meeting</em></p> +<ul> +<li>coffee and lunch provided</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p><strong>Date</strong></p> +<p>19th November 2013</p> +<p><strong>Location</strong></p> +<p>The TUC meeting will be held in <strong>The Tower</strong> hotel (<a href="http://goo.gl/qZt8Fz">Google Maps link</a>) approximately 4 minutes walk from the <a href="http://www.graphconnect.com/london/">GraphConnect</a> conference in London.</p> +<p>Getting there</p> +<ul> +<li>From City Airport is the easiest: short ride on the DLR to Tower Gateway. Easy.</li> +<li>From London Heathrow: first need to take the Heathrow Express to Paddington. Then take the Circle line to Tower Hill. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554995.pdf">See attached</a>.</li> +</ul> +<h3 id="ldbctuc-background">LDBC/TUC Background</h3> +<p>Looking back, we have been working on two benchmarks for the past year: a Social Network Benchmark (SNB) and a Semantic Publishing Benchmark (SPB). While below we provide a short summary, all the details of the work on these benchmark development efforts can be found in the first yearly progress reports:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SNB_Report_Nov2013.pdf</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SPB_Report_Nov2013.pdf</a></li> +</ul> +<p>A summary of these efforts can be read below or, for a more detailed account, please refer to: <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554967.pdf">The Linked Data Benchmark Council: a Graph and RDF industry benchmarking effort</a>. Annual reports about the progress, results, and future work of these two efforts will soon be available for download here, and will be discussed in depth at the TUC.</p> +<h4 id="social-network-benchmark">Social Network Benchmark</h4> +<p>The Social Network Benchmark (SNB) is designed for evaluating a broad range of technologies for tackling graph data management workloads. The systems targeted are quite broad: from graph, RDF, and relational database systems to Pregel-like graph compute frameworks. The social network scenario was chosen with the following goals in mind:</p> +<ul> +<li>it should be understandable, and the relevance of managing such data should be understandable</li> +<li>it should cover the complete range of interesting challenges, according to the benchmark scope</li> +<li>the queries should be realistic, i.e., similar data and workloads are encountered in practice</li> +</ul> +<p>SNB includes a data generator for creation of synthetic social network data with the following characteristics:</p> +<ul> +<li>data schema is representative of real social networks</li> +<li>data generated includes properties occurring in real data, e.g. 
irregular structure, structure/value correlations, power-law distributions</li> +<li>the software generator is easy-to-use, configurable and scalable</li> +</ul> +<p>SNB is intended to cover a broad range of aspects of social network data management, and therefore includes three distinct workloads:</p> +<ul> +<li><strong>Interactive</strong> +<ul> +<li>Tests system throughput with relatively simple queries and concurrent updates, it is designed to test ACID features and scalability in an online operational setting.</li> +<li>The targeted systems are expected to be those that offer transactional functionality.</li> +</ul> +</li> +<li><strong>Business Intelligence</strong> +<ul> +<li>Consists of complex structured queries for analyzing online behavior of users for marketing purposes, it is designed to stress query execution and optimization.</li> +<li>The targeted systems are expected to be those that offer an abstract query language.</li> +</ul> +</li> +<li><strong>Graph Analytics</strong> +<ul> +<li>Tests the functionality and scalability of systems for graph analytics, which typically cannot be expressed in a query language.</li> +<li>Analytics is performed on most/all of the data in the graph as a single operation and produces large intermediate results, and it is not not expected to be transactional or need isolation.</li> +<li>The targeted systems are graph compute frameworks though database systems may compete, for example by using iterative implementations that repeatedly execute queries and keep intermediate results in temporary data structures.</li> +</ul> +</li> +</ul> +<h4 id="semantic-publishing-benchmark">Semantic Publishing Benchmark</h4> +<p>The Semantic Publishing Benchmark (SPB) simulates the management and consumption of RDF metadata that describes media assets, or creative works.</p> +<p>The scenario is a media organization that maintains RDF descriptions of its catalogue of creative works &ndash; input was provided by actual media organizations which make heavy use of RDF, including the BBC. The benchmark is designed to reflect a scenario where a large number of aggregation agents provide the heavy query workload, while at the same time a steady stream of creative work description management operations are in progress. This benchmark only targets RDF databases, which support at least basic forms of semantic inference. A tagging ontology is used to connect individual creative work descriptions to instances from reference datasets, e.g. sports, geographical, or political information. The data used will fall under the following categories: reference data, which is a combination of several Linked Open Data datasets, e.g. GeoNames and DBpedia; domain ontologies, that are specialist ontologies used to describe certain areas of expertise of the publishing, e.g., sport and education; publication asset ontologies, that describe the structure and form of the assets that are published, e.g., news stories, photos, video, audio, etc.; and tagging ontologies and the metadata, that links assets with reference/domain ontologies.</p> +<p>The data generator is initialized by using several ontologies and datasets. The instance data collected from these datasets are then used at several points during the execution of the benchmark. 
Data generation is performed by generating SPARQL fragments for create operations on creative works and executing them against the RDF database system.</p> +<p>Two separate workloads are modeled in SPB:</p> +<ul> +<li><strong>Editorial:</strong> Simulates creating, updating and deleting creative work metadata descriptions. Media companies use both manual and semi-automated processes for efficiently and correctly managing asset descriptions, as well as annotating them with relevant instances from reference ontologies.</li> +<li><strong>Aggregation:</strong> Simulates the dynamic aggregation of content for consumption by the distribution pipelines (e.g. a web-site). The publishing activity is described as &ldquo;dynamic&rdquo;, because the content is not manually selected and arranged on, say, a web page. Instead, templates for pages are defined and the content is selected when a consumer accesses the page.</li> +</ul> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505026.pdf">Status of the Semantic Publishing Benchmark</a></p> + + + + + Second TUC Meeting + https://ldbcouncil.org/event/second-tuc-meeting/ + Mon, 22 Apr 2013 10:00:00 +0000 + + https://ldbcouncil.org/event/second-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the second Technical User Community (TUC) meeting.</p> +<p>This will be a two day event in Munich on the <strong>22/23rd April 2013</strong>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend. 
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +<li><a href="#venue">Venue</a> +<ul> +<li><a href="#getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</a></li> +<li><a href="#getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</a></li> +<li><a href="#getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</a></li> +</ul> +</li> +<li><a href="#getting-there">Getting there</a></li> +<li><a href="#social-dinner">Social Dinner</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>April 22nd</strong></p> +<p>10:00 <em>Registration.</em><br> +10:30 Josep Lluis Larriba Pey (UPC) - <em>Welcome and Introduction.</em><br> +10:30 Peter Boncz (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687373.pptx">LDBC: goals and status</a></p> +<p><em>Social Network Use Cases (with discussion moderated by Josep Lluis Larriba Pey)</em></p> +<p>11:00 Josep Lluis Larriba Pey (UPC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687372.pdf">Social Network Benchmark Task Force</a><br> +11:30 Gustavo González (Mediapro): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687367.pdf">Graph-based User Modeling through Real-time Social Streams</a><br> +12:00 Klaus Großmann (Dshini): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687365.pdf">Neo4j at Dshini</a></p> +<p>12:30 Lunch</p> +<p><em>Semantic Publishing Use Cases (with discussion moderated by Barry Bishop)</em></p> +<p>13:30 Barry Bishop (Ontotext): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687366.pptx">Semantic Publishing Benchmark Task Force</a><br> +14:00 Dave Rogers (BBC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687364.pptx">Linked Data Platform at the BBC</a><br> +14:30 Edward Thomas (Wolters Kluwer): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687374.pdf">Semantic Publishing at Wolters Kluwer</a></p> +<p>15:00 Coffee break</p> +<p><em>Projects Related to LDBC</em></p> +<p>15:30 Fabian Suchanek (MPI): &ldquo;YAGO: A large knowledge base from Wikipedia and WordNet&rdquo;<br> +16:00 Antonis Loziou (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687375.pptx">The OpenPHACTS approach to data integration</a><br> +16:30 Mirko Kämpf (Brox): &ldquo;GeoKnow - Spatial Data Web project and Supply Chain Use Case&rdquo;</p> +<p>17:00 <em>End of first day</em></p> +<p>19:00 Social dinner</p> +<p><strong>April 23rd</strong></p> +<p><em>Industry &amp; Hardware Aspects</em></p> +<p>10:00 Xavier Lopez (Oracle): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687384.pdf">Graph Database Performance an Oracle Perspective.pdf</a><br> +10:30 Pedro Trancoso (University of Cyprus): &ldquo;Benchmarking and computer architecture: the research 
side&rdquo;</p> +<p>11:00 Coffee break</p> +<p><em>Future Steps and TUC feedback session</em></p> +<p>11:30 Peter Boncz (VUA) moderates: next steps in the Social Networking Task Force<br> +12:00 Barry Bishop (Ontotext) moderates: next steps in the Semantic Publishing Task Force&quot;</p> +<p>12:30 <em>End of meeting</em></p> +<h3 id="logistics">Logistics</h3> +<h4 id="date">Date</h4> +<p>22nd and 23th April 2013</p> +<h4 id="location">Location</h4> +<p>The TUC meeting will be held at LE009 room at LRZ (Leibniz-Rechenzentrum) located inside the TU Munich campus in Garching, Germany. The address is:</p> +<p>LRZ (Leibniz-Rechenzentrum)<br> +Boltzmannstraße 1<br> +85748 Garching, Germany</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including Taxi and Subway <a href="http://www.in.tum.de/fileadmin/user_upload/Sonstiges/anfahrt_garching.pdf">Ubahn</a></p> +<h5 id="getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</h5> +<p>Take the U-bahn line U6 in the direction of Garching-Forschungszentrum, exit at the end station. Take the south exit to MI-Building and LRZ on the Garching Campus. The time of the journey from the city center is approx. 25-30 minutes. In order to get here from the City Center, you need the Munich XXL ticket that costs around 7.50 euros and covers all types of transportation for one day. The ticket has to be validated before ride.</p> +<h5 id="getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</h5> +<ol> +<li> +<p>(except weekends) S-Bahn S8 line in the direction of (Hauptbahnhof) Munich Central Station until the third stop, Ismaning (approx. 13 minutes). From here Bus Nr. 230 until stop MI-Building on the Garching Campus. Alternatively: S1 line until Neufahrn, then with the Bus 690, which stops at Boltzmannstraße.</p> +</li> +<li> +<p>S-Bahn lines S8 or S1 towards City Center until Marienplatz stop. Then change to U-bahn U6 line towards Garching-Forschungszentrum, exit at the last station. Take the south exit to MI-Building and LRZ.</p> +</li> +<li> +<p>Taxi: fare is ca. 30-40 euros.</p> +</li> +</ol> +<p>For cases 1 and 2, before the trip get the One-day Munich Airport ticket and validate it. It will cover all public transportation for that day.</p> +<h5 id="getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</h5> +<p>The city of Garching is located on the U6 line, one stop before the Garching-Forschungszentrum. In order to get from Garching to Garching-Forschungszentrum with the U-bahn, a special one-way ticket called Kurzstrecke (1.30 euros) can be purchased.</p> +<p><strong>Finding LRZ@TUM</strong></p> +<p><a href="http://www.openstreetmap.org/?mlat=48.2615702464&amp;mlon=11.6686558264&amp;zoom=32">OpenStreetMap link</a></p> +<p><a href="https://maps.google.com/maps?q=48.2615702464,11.6686558264&amp;spn=0.005,0.005&amp;t=k">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687268.gif" alt=""></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687269.gif" alt=""></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying: Munich</strong> airport is located 28.5 km northeast of Munich. 
There are two ways to get from the airport to the city center: suburban train (S-bahn) and Taxi.</p> +<p><strong>S-Bahn:</strong> S-bahn lines S1 and S8 will get you from the Munich airport to the city center, stopping at both Munich Central Station (Hauptbahnhof) and Marienplatz. One-day Airport-City ticket costs 11.20 euros and is valid for the entire Munich area public transportation during the day of purchase (the tickets needs to be validated before the journey). S-bahn leaves every 5-20 minutes and reaches the city center in approx. 40 minutes.</p> +<p><strong>Taxi:</strong> taxi from the airport to the city center costs approximately 50 euros</p> +<h4 id="social-dinner">Social Dinner</h4> +<p>The social dinner will take place at 7 pm on April 22 in Hofbräuhaus (second floor)</p> +<p>Address: Hofbräuhaus, Platzl 9, Munich</p> + + + + + First TUC Meeting + https://ldbcouncil.org/event/first-tuc-meeting/ + Mon, 19 Nov 2012 09:00:00 +0100 + + https://ldbcouncil.org/event/first-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the first Technical User Community (TUC) meeting. This will be a two day event in Barcelona on the <strong>19/20th November 2012</strong>.</p> +<p>So far more than six commercial consumers of graph/RDF database technology have expressed an interest in attending the event and more are welcome. The proposed format of the event wil include:</p> +<ul> +<li>Introduction by the coordinator and technical director explaining the objectives of the LDBC project</li> +<li>Invitation to users to explain their use-cases and describe the limitations they have found in current technology</li> +<li>Brain-storming session for identifying trends and mapping out strategies to tackle existing choke-points</li> +</ul> +<p>The exact agenda will be published here as things get finalised before the event.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#slide">Slide</a> +<ul> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +</ul> +</li> +<li><a href="#venue">Venue</a></li> +<li><a href="#getting-there">Getting there</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p>We will start at 9:00 on Monday for a full day, followed by a half a day on Tuesday to allow attendees to travel home on the evening of the 20th.</p> +<p><strong>Day 1</strong></p> +<p>09:00 Welcome (Location: Aula Master)<br> +09:30 Project overview (Emphasis on task forces?) 
+ Questionnaire results?<br> +10:30 Coffee break<br> +11:00 User talks (To gather information for use cases?)</p> +<p>13:00 Lunch</p> +<p>14:00 User talks (cont.)<br> +15:00 Use case discussions (based on questionnaire results + consortium proposal + user talks).<br> +16:00 Task force proposals (consortium)<br> +17:00 Finish first day</p> +<p>20:00 Social dinner</p> +<p><strong>Day 2</strong></p> +<p>10:00 Task force discussion (consortium + TUC)<br> +11:00 Coffe break<br> +11:30 Task force discussion (consortium + TUC)<br> +12:30 Summaries (Task forces, use cases, &hellip;) and actions</p> +<p>13:00 Lunch and farewell</p> +<p>15:00 LDBC Internal meeting</p> +<h3 id="slide">Slide</h3> +<p>Opening session:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686995.pptx">CWI – Peter Boncz</a> – Objectives</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687001.pdf">UPC – Larri</a> – Questionnaire</li> +</ul> +<p>User stories:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686998.pdf">BBC – Jem Rayfield</a></li> +<li>CA Technologies – Victor Muntés</li> +<li>Connected Discovery (Open Phacts) – Bryn Williams-Jones</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687003.pptx">Elsevier – Alan Yagoda</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687000.pptx">ERA7 Bioinformatics – Eduardo Pareja</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687005.pptx">Press Association – Jarred McGinnis</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687004.pptx">RJLee – David Neuer</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686994.pdf">Yale – Lec Maj</a></li> +</ul> +<p>Benchmark proposals:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686991.pdf">Publishing benchmark proposal – Ontotext – Barry Bishop</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687002.pdf">Social Network Benchmark Proposal – UPC – Larri</a></li> +</ul> +<h4 id="logistics">Logistics</h4> +<h5 id="date">Date</h5> +<p>19th and 20th November 2012</p> +<h5 id="location">Location</h5> +<p>The TUC meeting will be held at “Aula Master” at A3 building located inside the “Campus Nord de la UPC” in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<p><strong>Finding UPC</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<p><strong>Finding the meeting room</strong></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €16 and trips to other destinations in the city cost approximately €18.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<p><strong>The locations of the airport and the city centre</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933317.jpg" alt=""></p> +<p><strong>Bus map</strong></p> + + + + + \ No newline at end of file diff --git a/event/ninth-tuc-meeting/index.html b/event/ninth-tuc-meeting/index.html new file mode 100644 index 00000000..cce5ecc8 --- /dev/null +++ b/event/ninth-tuc-meeting/index.html @@ -0,0 +1,703 @@ + + + + + Ninth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Ninth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Marcus Paradies / on 14 Feb 2017
+ + + +
+ Location: SAP Headquarters in Walldorf Germany +
+
+ + Event dates: 09 Feb 2017 15:07 -- 10 Feb 2017 15:07 (local timezone) + +
+
+

LDBC is pleased to announce its Ninth Technical User Community (TUC) meeting.

+

This will be a two-day event at SAP Headquarters in Walldorf, Germany on February 9+10, 2017.

+

This will be the third TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will focus on the following aspects:

+
    +
  • Two-day event with one day devoted to users’ experiences and one day devoted to benchmarking experiences.
  • +
  • Presentation of the benchmarking results for the different benchmarks.
  • +
  • Interaction with the new LDBC Board of Directors and the LDBC organisation officials.
  • +
+

We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at damaris@ac.upc.edu.

+

In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.

+

Further, we call on you if you or your colleagues happen to have contacts with companies that deal with graph data management scenarios: please invite them to attend and possibly present. LDBC is always looking to expand its circle of participants in TUC meetings, its graph technology user contacts, and eventually its membership base.

+

Agenda

+

In the TUC meeting there will be

+
    +
  • updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence, and Graphalytics workloads.
  • +
  • talks by data management practitioners highlighting graph data management challenges
  • +
  • selected scientific talks on graph data management technology
  • +
+

The meeting will start on Thursday morning, with a program from 09:00-18:00, interrupted by a lunch break.

+

Thursday evening (19:00-21:00) there will be a social dinner in Heidelberg.

+

Friday morning the event resumes from 9:00-12:00. In the afternoon, there is a (closed) LDBC Board of Directors meeting (13:00-16:30) at the same venue.

+

Social Dinner

+

+

Address: Hauptstraße 217, 69117 Heidelberg
+Time: 19:00 / 7pm

+

(See attachments at the bottom of the page)

+
Thursday
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
start timetitle – speaker
9:00Welcome and logistics - Marcus Paradies (SAP)
9:10Intro + state of the LDBC - Josep Lluis Larriba Pey (UPC)
9:20LDBC Graph QL task force - Hannes Voigt (TU Dresden)
9:40PGQL Status Update and Comparison to LDBC’s Graph QL proposals - Oskar van Rest (Oracle Labs)
10:00Adding shortest-paths to MonetDB - Dean de Leo (CWI)
10:20coffee
10:50Evolving Cypher for processing multiple graphs - Stefan Plantikow (Neo Technology)
11:10Standardizing Graph Database Functionality - An Invitation to Collaborate - Jan Michels (ISO/ANSI SQL, Oracle)"
11:30Dgraph: Graph database for production environment - Tomasz Zdybal (Dgraph.io)
12:00lunch
13:00LDBC Graphalytics: Current Capabilities, Upcoming Features, and Long-Term Roadmap - Alexandru Iosup (TU Delft)
13:20LDBC Graphalytics: Demo of the Live Archive and Competition Features - Tim Hegeman (TU Delft)
13:40LDBC SNB Datagen Update - Arnau Prat (UPC)
14:00LDBC SNB Business Intelligence Workload: Chokepoint Analysis - Arnau Prat (UPC)
14:20LDBC Benchmark Cost Specification (+discussion) - Moritz Kaufmann (TU Munich)
14:40coffee break
15:10EYWA: the Distributed Graph Engine in Huawei MIND Platform (Yinglong Xia)
15:30Graph Processing in SAP HANA - Marcus Paradies (SAP)
15:50Distributed Graph Analytics with Gradoop - Martin Junghanns (Univ Leipzig)
16:10Distributed graph flows: Cypher on Flink and Gradoop - Max Kießling (Neo Technology)
16:30closing - Peter Boncz
17:30end
+
Friday
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
start timetitle – speaker
9:00welcome - Peter Boncz
9:20Graph processing in obi4wan - Frank Smit (OBI4WAN)
9:40Graph problems in the space domain - Albrecht Schmidt (ESA)
10:00Medical Ontologies for Healthcare - Michael Neumann (SAP)
10:20coffee
10:50The Train Benchmark: Cross-Technology Performance Evaluation of Continuous Model Queries - Gabor Szarnyas (BME)
11:10Efficient sparse matrix computations and their generalization to graph computing applications - Albert-Jan Yzelman (Huawei)
11:30Experiments on Semantic Publishing Benchmark with large scale real news and LOD data at FactForge - Atanas Kyriakov (Ontotext)
12:00lunch
13:00LDBC Board of Directors Meeting
17:00end
+

Logistics

+
Important things to know
+

The following PDF guide provides additional information, such as recommended restaurants as well as sightseeing spots: link

+
Venue
+

The TUC meeting will be held at SAP Headquarters, in the SAP Guesthouse Kalipeh (https://www.kalipeh.com). The address is:

+

WDF 44 / SAP Guesthouse Kalipeh
+Dietmar-Hopp-Allee 15
+69190 Walldorf
+Germany

+
Maps and situation
+

Google Maps link

+

+

Getting there

+
By plane
+

There are two airports close to SAP’s headquarters: Frankfurt Airport (FRA) and Stuttgart-Echterdingen Airport (STR). The journey from Frankfurt Airport to SAP headquarters takes about one hour by car, while it takes slightly longer from Stuttgart-Echterdingen Airport. Concerning airfare, flights to Frankfurt are usually somewhat more expensive than to Stuttgart.

+

When booking flights to Frankfurt, you should be aware of Frankfurt-Hahn Airport (HHN), which serves low-cost carriers but is not connected to Frankfurt Airport. Frankfurt Hahn is approximately one hour from the Frankfurt main airport by car.

+

The journey from Frankfurt Airport to SAP headquarters takes about one hour by car (95 kilometers, or 59 miles).

+

Journey time from Stuttgart-Echterdingen Airport to SAP headquarters takes about 1 hour and 15 minutes by car (115 kilometers, or 71 miles).

+
Driving directions
+

Traveling from Frankfurt Airport (FRA) to SAP Headquarters:

+

Directions to SAP headquarters:

+
    +
  • When leaving the airport, follow the highway symbol onto “A3/Würzburg/A5/Kassel/Basel/Frankfurt.”
  • +
  • Follow the A5 to “Basel/Karlsruhe/Heidelberg.”
  • +
  • Take exit 39 – “Walldorf/Wiesloch.”
  • +
  • Turn left onto B291.
  • +
  • Turn right onto Dietmar-Hopp-Allee.
  • +
+

(Should you use a navigational system which does not recognize the street name ‘Dietmar-Hopp-Allee’ please use ‘Neurottstrasse’ instead.)

+

Traveling from Stuttgart-Echterdingen Airport (STR) to SAP Headquarters:

+

To get to SAP headquarters by car, there are two possible routes to take. The first leads you via Heilbronn and the second via Karlsruhe. The route via Karlsruhe is a bit shorter yet may be more congested.

+

Directions to SAP headquarters:

+
    +
  • When leaving the airport, follow the highway symbol onto “A8/Stuttgart/B27.”
  • +
  • Stay on A8 and follow the sign for “Karlsruhe/Heilbronn/Singen/A8.”
  • +
  • Follow A8 to Karlsruhe.
  • +
  • Take exit 41 – “Dreieck Karlsruhe” to merge onto A5 toward “Frankfurt/Mannheim/Karlsruhe/Landau (Pfalz).”
  • +
  • Take exit 39 – “Walldorf/Wiesloch.”
  • +
  • Turn left onto B291.
  • +
  • Turn right onto Dietmar-Hopp-Allee.
  • +
+
Parking
+

The closest parking lot to the event location is P7 (see figure above).

+
By Train
+

As the infrastructure is very well developed in Europe, and in Germany in particular, taking the train is a great and easy way of traveling. Furthermore, the trains usually run on time, so this mode of travel is very convenient, especially for a group of people on longer journeys to major cities.

+

From Frankfurt Airport (FRA) to SAP Headquarters

+

Directions to SAP headquarters:

+
    +
  • Go to Terminal 1, level T (see overview in Appendix).
  • +
  • Go to the AIRail Terminal – “Fernbahnhof” (long-distance trains).
  • +
  • Choose a connection with the destination train station “Wiesloch–Walldorf”.
  • +
  • From station “Wiesloch–Walldorf,” take bus number 707 or 721 toward “Industriegebiet Walldorf, SAP.” It is a 10-minute ride to reach bus stop ‘SAP headquarters’.
  • +
+

From Stuttgart-Echterdingen Airport (STR) to SAP Headquarters

+

Directions to SAP headquarters:

+
    +
  • Go to the S-Bahn station in the airport, following the sign (station is called “Stuttgart Flughafen/Messe”).
  • +
  • Take train number S2 or S3 to “Stuttgart Hauptbahnhof” (main station).
  • +
  • From Stuttgart Hauptbahnhof choose a connection with the destination train station “Wiesloch–Walldorf”.
  • +
  • From station “Wiesloch–Walldorf,” take bus number 707 or 721 toward “Industriegebiet Walldorf, SAP”. It is a 10-minute ride to reach bus stop ‘SAP headquarters’.
  • +
+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/page/1/index.html b/event/page/1/index.html new file mode 100644 index 00000000..7fa970fd --- /dev/null +++ b/event/page/1/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/event/ + + + + + + diff --git a/event/page/2/index.html b/event/page/2/index.html new file mode 100644 index 00000000..bedd856f --- /dev/null +++ b/event/page/2/index.html @@ -0,0 +1,670 @@ + + + + + Events + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Events

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Twelfth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

LDBC is pleased to announce its Twelfth Technical User Community (TUC) meeting.

+

LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, …

+ +
+
+ +
+ + +
+
+
+ +

Eleventh TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmark development, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j and Huawei among its members.

+

This TUC meeting will be a one-day event preceding the SIGMOD/PODS …

+ +
+
+ +
+ + +
+
+
+ +

Tenth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

This will be a one-day event at the VLDB 2017 conference in Munich, Germany on September 1, 2017.

+

Topics and activities of interest in these TUC meetings are:

+
    +
  • Presentation on graph data management usage scenarios.
  • +
  • Presentation of the benchmarking results for the different benchmarks, as well as the graph query language task force.
  • +
  • Interaction with the new LDBC Board of Directors and the LDBC organisation officials.
  • +
+

We welcome all users of RDF …

+ +
+
+ +
+ + +
+
+
+ +

Ninth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

LDBC is pleased to announce its Ninth Technical User Community (TUC) meeting.

+

This will be a two-day event at SAP Headquarters in Walldorf, Germany on February 9+10, 2017.

+

This will be the third TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will focus on the following aspects:

+
    +
  • Two-day event with one day devoted to users’ experiences and one day devoted to benchmarking experiences.
  • +
  • Presentation of the …
+ +
+
+ +
+ + +
+
+
+ +

Eighth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

The LDBC consortium is pleased to announce its Eighth Technical User Community (TUC) meeting.

+

This will be a two-day event at the Oracle Conference Center in the Redwood Shores facility on Wednesday and Thursday June 22-23, 2016.

+

This will be the second TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will focus on the following aspects:

+
    +
  • Two day …
+ +
+
+ +
+ + +
+
+
+ +

Seventh TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

The LDBC consortium is pleased to announce its Seventh Technical User Community (TUC) meeting.

+

This will be a two-day event at IBM’s TJ Watson facility on Monday and Tuesday November 9/10, 2015.

+

This will be the first TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will focus on the following aspects:

+
    +
  • Two-day event with one day devoted to users’ experiences and one day devoted to benchmarking …
+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/page/3/index.html b/event/page/3/index.html new file mode 100644 index 00000000..17718244 --- /dev/null +++ b/event/page/3/index.html @@ -0,0 +1,666 @@ + + + + + Events + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Events

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Sixth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

The LDBC consortium are pleased to announce its Sixth Technical User Community (TUC) meeting.

+

This will be a two-day event at Universitat Politècnica de Catalunya, Barcelona on Thursday and Friday March 19/20, 2015.

+

The LDBC FP7 EC funded project is reaching its finalisation, and this will be the last event sponsored directly by the project. However, tasks within LDBC will continue under the independent LDBC organisation. The event will …

+ +
+
+ +
+ + +
+
+
+ +

Fifth TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

The LDBC consortium are pleased to announce its fifth Technical User
+Community (TUC) meeting.

+

This will be a one-day event at the National Hellenic Research Institute
+in Athens, Greece on Friday November 14, 2014.

+

Agenda

+

10:30 - 11:00 Coffee Break

+

11:00 - 11:10 Peter Boncz (VUA) Welcome & LDBC project status update (Presentation)

+

11:00 - 11:25 Venelin Kotsev (ONTO) Semantic Publishing Benchmark: Short Presentation of SPB and Status

+

Feedback …

+ +
+
+ +
+ + +
+
+
+ +

Fourth TUC meeting

+
Tags:
+ TUC MEETING + +
+
+ +

The LDBC consortium are pleased to announce the fourth Technical User Community (TUC) meeting.

+

This will be a one-day event at CWI in Amsterdam on Thursday April 3, 2014.

+

The event will include:

+
    +
  • Introduction to the objectives and progress of the LDBC project.
  • +
  • Description of the progress of the benchmarks being evolved through Task Forces.
  • +
  • Users explaining their use-cases and describing the limitations they have found in current technology. …
+ +
+
+ +
+ + +
+
+
+ +

Third TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

The LDBC consortium is pleased to announce the third Technical User Community (TUC) meeting!

+

This will be a one-day event in London on 19 November 2013, running in collaboration with the GraphConnect event (18/19 November). Registered TUC participants who would like a free pass to all of GraphConnect should register for GraphConnect using the following coupon code: LDBCTUC.

+

The TUC event will include:

+
    +
  • Introduction to the objectives and …
+ +
+
+ +
+ + +
+
+
+ +

Second TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

The LDBC consortium are pleased to announce the second Technical User Community (TUC) meeting.

+

This will be a two day event in Munich on the 22/23rd April 2013.

+

The event will include:

+
    +
  • Introduction to the objectives and progress of the LDBC project.
  • +
  • Description of the progress of the benchmarks being evolved through Task Forces.
  • +
  • Users explaining their use-cases and describing the limitations they have found in current technology.
  • +
  • Industry …
+ +
+
+ +
+ + +
+
+
+ +

First TUC Meeting

+
Tags:
+ TUC MEETING + +
+
+ +

The LDBC consortium are pleased to announce the first Technical User Community (TUC) meeting. This will be a two day event in Barcelona on the 19/20th November 2012.

+

So far, more than six commercial consumers of graph/RDF database technology have expressed an interest in attending the event, and more are welcome. The proposed format of the event will include:

+
    +
  • Introduction by the coordinator and technical director explaining the objectives of the …
+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/second-tuc-meeting/index.html b/event/second-tuc-meeting/index.html new file mode 100644 index 00000000..40a3572e --- /dev/null +++ b/event/second-tuc-meeting/index.html @@ -0,0 +1,559 @@ + + + + + Second TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Second TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Josep Larriba Pey / on 25 Apr 2013
+ + + +
+ Location: Munich, Germany +
+
+ + Event dates: 22 Apr 2013 10:00 -- 23 Apr 2013 17:00 (local timezone) + +
+
+

The LDBC consortium are pleased to announce the second Technical User Community (TUC) meeting.

+

This will be a two day event in Munich on the 22/23rd April 2013.

+

The event will include:

+
    +
  • Introduction to the objectives and progress of the LDBC project.
  • +
  • Description of the progress of the benchmarks being evolved through Task Forces.
  • +
  • Users explaining their use-cases and describing the limitations they have found in current technology.
  • +
  • Industry discussions on the contents of the benchmarks.
  • +
+

All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu

+ +

Agenda

+

April 22nd

+

10:00 Registration.
+10:30 Josep Lluis Larriba Pey (UPC) - Welcome and Introduction.
+10:30 Peter Boncz (VUA): LDBC: goals and status

+

Social Network Use Cases (with discussion moderated by Josep Lluis Larriba Pey)

+

11:00 Josep Lluis Larriba Pey (UPC): Social Network Benchmark Task Force
+11:30 Gustavo González (Mediapro): Graph-based User Modeling through Real-time Social Streams
+12:00 Klaus Großmann (Dshini): Neo4j at Dshini

+

12:30 Lunch

+

Semantic Publishing Use Cases (with discussion moderated by Barry Bishop)

+

13:30 Barry Bishop (Ontotext): Semantic Publishing Benchmark Task Force
+14:00 Dave Rogers (BBC): Linked Data Platform at the BBC
+14:30 Edward Thomas (Wolters Kluwer): Semantic Publishing at Wolters Kluwer

+

15:00 Coffee break

+

Projects Related to LDBC

+

15:30 Fabian Suchanek (MPI): “YAGO: A large knowledge base from Wikipedia and WordNet”
+16:00 Antonis Loziou (VUA): The OpenPHACTS approach to data integration
+16:30 Mirko Kämpf (Brox): “GeoKnow - Spatial Data Web project and Supply Chain Use Case”

+

17:00 End of first day

+

19:00 Social dinner

+

April 23rd

+

Industry & Hardware Aspects

+

10:00 Xavier Lopez (Oracle): Graph Database Performance an Oracle Perspective.pdf
+10:30 Pedro Trancoso (University of Cyprus): “Benchmarking and computer architecture: the research side”

+

11:00 Coffee break

+

Future Steps and TUC feedback session

+

11:30 Peter Boncz (VUA) moderates: next steps in the Social Networking Task Force
+12:00 Barry Bishop (Ontotext) moderates: next steps in the Semantic Publishing Task Force

+

12:30 End of meeting

+

Logistics

+

Date

+

22nd and 23rd April 2013

+

Location

+

The TUC meeting will be held at LE009 room at LRZ (Leibniz-Rechenzentrum) located inside the TU Munich campus in Garching, Germany. The address is:

+

LRZ (Leibniz-Rechenzentrum)
+Boltzmannstraße 1
+85748 Garching, Germany

+

Venue

+

To reach the campus, there are several options, including taxi and subway (U-Bahn)

+
Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)
+

Take the U-bahn line U6 in the direction of Garching-Forschungszentrum, exit at the end station. Take the south exit to MI-Building and LRZ on the Garching Campus. The time of the journey from the city center is approx. 25-30 minutes. In order to get here from the City Center, you need the Munich XXL ticket that costs around 7.50 euros and covers all types of transportation for one day. The ticket has to be validated before the ride.

+
Getting to the TUM Campus from the Munich Airport
+
    +
  1. +

    (except weekends) S-Bahn S8 line in the direction of (Hauptbahnhof) Munich Central Station until the third stop, Ismaning (approx. 13 minutes). From here Bus Nr. 230 until stop MI-Building on the Garching Campus. Alternatively: S1 line until Neufahrn, then with the Bus 690, which stops at Boltzmannstraße.

    +
  2. +
  3. +

    S-Bahn lines S8 or S1 towards City Center until Marienplatz stop. Then change to U-bahn U6 line towards Garching-Forschungszentrum, exit at the last station. Take the south exit to MI-Building and LRZ.

    +
  4. +
  5. +

    Taxi: fare is ca. 30-40 euros.

    +
  6. +
+

For cases 1 and 2, before the trip get the One-day Munich Airport ticket and validate it. It will cover all public transportation for that day.

+
Getting to the TUM Campus from Garching: U-Bahn
+

The city of Garching is located on the U6 line, one stop before the Garching-Forschungszentrum. In order to get from Garching to Garching-Forschungszentrum with the U-bahn, a special one-way ticket called Kurzstrecke (1.30 euros) can be purchased.

+

Finding LRZ@TUM

+

OpenStreetMap link

+

Google Maps link

+

+

+

Getting there

+

Flying: Munich airport is located 28.5 km northeast of Munich. There are two ways to get from the airport to the city center: suburban train (S-bahn) and Taxi.

+

S-Bahn: S-bahn lines S1 and S8 will get you from the Munich airport to the city center, stopping at both Munich Central Station (Hauptbahnhof) and Marienplatz. The one-day Airport-City ticket costs 11.20 euros and is valid for the entire Munich area public transportation during the day of purchase (the ticket needs to be validated before the journey). The S-bahn leaves every 5-20 minutes and reaches the city center in approx. 40 minutes.

+

Taxi: a taxi from the airport to the city center costs approximately 50 euros.

+

Social Dinner

+

The social dinner will take place at 7 pm on April 22 in Hofbräuhaus (second floor)

+

Address: Hofbräuhaus, Platzl 9, Munich

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/seventeenth-tuc-meeting/index.html b/event/seventeenth-tuc-meeting/index.html new file mode 100644 index 00000000..5282af51 --- /dev/null +++ b/event/seventeenth-tuc-meeting/index.html @@ -0,0 +1,572 @@ + + + + + Seventeenth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Seventeenth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Renzo Angles / on 18 Apr 2024
+ + + +
+ Location: Santiago de Chile +
+
+ + Event date: 09 Jun 2024 09:00 (local timezone) + +
+
+

Organizers: Renzo Angles, Sebastián Ferrada

+

LDBC is hosting a one-day in-person workshop, co-located in Santiago de Chile with SIGMOD 2024 on June 9 (Sunday).

+

The workshop will be held in the Hotel Plaza El Bosque Ebro (https://www.plazaelbosque.cl), which is two blocks away from SIGMOD’s venue. See the map here.

+

If you would like to participate, please register using this form.

+

Program

+

All times are in Chile time (GMT-4).

+

Each speaker will have 20 minutes for exposition plus 5 minutes for questions.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
TimeSpeakerTitle
09:00Welcome“Canelo” saloon
09:30Alastair Green (LDBC Vice-chair)Status of the LDBC Extended GQL Schema Working Group
10:00Hannes Voigt (Neo4j)Inside the Standardization Machine Room: How ISO/IEC 39075:2024 – GQL was produced
10:30Calin Iorgulescu (Oracle)PGX.D: Distributed graph processing engine
11:00Coffee break
11:30Ricky Sun (Ultipa, Inc.)A Unified Graph Framework with SCC (Storage-Compute Coupled) and HDC (High-Density Computing) Clustering
12:00Daan de Graaf (TU Eindhoven)Algorithm Support in a Graph Database, Done Right
12:30Angela Bonifati (Lyon 1 University and IUF, France)Transforming Property Graphs
13:00Brunch
14:00Juan Sequeda (data.world)A Benchmark to Understand the Role of Knowledge Graphs on Large Language Model’s Accuracy for Question Answering on Enterprise SQL Databases
14:30Olaf Hartig (Linköping University)FedShop: A Benchmark for Testing the Scalability of SPARQL Federation Engines
15:00Olaf Hartig (Amazon)Datatypes for Lists and Maps in RDF Literals
15:30Peter Boncz (CWI and MotherDuck)The state of DuckPGQ
16:00Coffee break
16:30Juan Reutter (IMFD and PUC Chile)MillenniumDB: A Persistent, Open-Source, Graph Database
17:00Carlos Rojas (IMFD)WDBench: A Wikidata Graph Query Benchmark
17:30Sebastián Ferrada (IMFD and Univ. de Chile)An algebra for evaluating path queries
19:30Dinner
+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/seventh-tuc-meeting/index.html b/event/seventh-tuc-meeting/index.html new file mode 100644 index 00000000..6199693f --- /dev/null +++ b/event/seventh-tuc-meeting/index.html @@ -0,0 +1,558 @@ + + + + + Seventh TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Seventh TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Ioan Toma / on 26 Dec 2015
+ + + +
+ Location: IBM's TJ Watson, US +
+
+ + Event dates: 09 Nov 2015 14:17 -- 10 Nov 2015 14:17 (local timezone) + +
+
+

The LDBC consortium is pleased to announce its Seventh Technical User Community (TUC) meeting.

+

This will be a two-day event at IBM’s TJ Watson facility on Monday and Tuesday November 9/10, 2015.

+

This will be the first TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will focus on the following aspects:

+
    +
  • Two-day event with one day devoted to users’ experiences and one day devoted to benchmarking experiences.
  • +
  • Presentation of the benchmarking results for the different benchmarks.
  • +
  • Interaction with the new LDBC Board of Directors and the LDBC organisation officials.
  • +
+

We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at damaris@ac.upc.edu; in order to notify IBM security in advance, registration requests need to be in by Nov 1.

+

In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.

+

Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.

+

On this page, you’ll find information about the following items:

+ +

Agenda

+

Monday, 9th of November 2015

+

8:45 - 9:15 Registration and welcome (Yinglong Xia and Josep L. Larriba Pey)

+

9:15 - 9:30 LDBC introduction and status update (Josep L. Larriba-Pey)

+

9:30 - 10:30 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)

+

9:30 Arnau Prat (DAMA-UPC). Social Network Benchmark, Interactive workload

+

10:00 Orri Erling (OpenLink Software). Social Network Benchmark, Business Intelligence workload

+

10:30-11:00 Coffee break

+

11:00 - 12:30 Details on the progress of LDBC Task Forces 2 (chair Yinglong Xia)

+

11:00 Alexandru Iosup (TU Delft). Social Network Benchmark, Analytics workload.

+

11:30 Claudio Gutierrez (U Chile). Query Language Task Force status.

+

12:00 Atanas Kiryakov (Ontotext). Semantic Publishing Benchmark status

+

12:30 - 14:00 Lunch break

+

14:00 - 16:00 Technologies and benchmarking (chair Hassan Chafi)

+

14:00 Molham Aref (LogicBlox). Graph Data Management with LogicBlox

+

14:30 Peter Kogge (Notre Dame). BFS as in Graph500 on today’s architectures

+

15:00 Ching-Yung Lin (IBM). Status and Demo of IBM System G

+

15:30-16:00 Coffee break

+

16:00 - 17:00 Technologies (chair Irini Fundulaki)

+

16:00 Kavitha Srinivas (IBM). SQLGraph: An efficient relational based property graph store

+

16:30 David Ediger (GeorgiaTech). STINGER

+

17:00 Gary King (Franz Inc.). AllegroGraph’s SPARQL implementation with Social Network Analytics abilities using Magic Properties

+

17:30 Manoj Kumar (IBM). Linear Algebra Formulation for Large Graph Analytics

+

18:00 Reihaneh Amini (Wright State University) Linked Data in the GeoLink Usecase

+

19:00 Social dinner

+

Tuesday 10th November 2015

+

9:00 - 10:30 Technology, Applications and Benchmarking (chair Alexandru Iosup)

+

9:00 Philip Rathle (Neo). On openCypher

+

9:20 Morteza Shahriari (University of Florida). Multi-modal Probabilistic Knowledge Base for Remote Sensing Species Identification

+

9:50 Peter Kogge (Notre Dame). Challenging problems with Lexis Nexis Risk Solutions

+

10:10 Arnau Prat (DAMA-UPC). DATAGEN, status and perspectives for synthetic data generation

+

10:30 - 11:00 Coffee break

+

11:00 - 12:45 Applications and use of Graph Technologies (chair Atanas Kiryakov)

+

11:00 Hassan Chafi (Oracle). Status and characteristics of PGQL

+

11:20 David Guedalia (TAGIIO). Multi-tier distributed mobile applications and how they split their workload.

+

11:40 Guojing Cong (IBM). Algorithmic technique and architectural support for fast graph analysis

+

12:00 Josep Lluis Larriba-Pey. Conclusions for the TUC meeting and future perspectives

+

12:30 - 14:00 Lunch break

+

14:00 LDBC Board of Directors

+

Logistics

+
Date
+

9th and 10th November 2015

+
Venue
+

The TUC meeting will be held in the IBM Thomas J Watson Research Center.
+The address is:

+

IBM Thomas J Watson Research Center
+1101 Kitchawan Rd,
+Yorktown Heights, NY 10598, USA

+

If you are using a GPS system, please enter “200 Aqueduct Road, Ossining NY, 10562” for accurate directions to the lab entrance. You may also want to check the routing online.

+

The meeting will take place in the Auditorium on November 9th, and in Meeting Room 20-043 on November 10th.

+
Maps and situation
+

We strongly suggest renting a car for your convenience, since the public transportation system does not cover this area very well. Also, there is no hotel within walking distance of the IBM T.J. Watson Research Center. Feel free to arrange a carpool with other attendees. You can find car rentals and hotels through www.orbitz.com or www.expedia.com. Feel free to email yxia@us.ibm.com with any questions.

+

+
Getting there
+

Upper and Eastern New England

+

Route I-84 west to Route I-684, south to Exit 6, west on Route 35 to Route 100, south to Route 134, west 2.5 miles. IBM is on the left.

+

New Haven and Connecticut Shores

+

Merritt Parkway or New England Thruway (Route I-95) west to Route I-287, west to Exit 3, north on Sprain Brook Parkway, which merges into Taconic State Parkway, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.

+

New Jersey

+

Take New York State Thruway (Route I-87) east across the Tappan Zee Bridge and follow signs to the Saw Mill Parkway north. Proceed north on Saw Mill River Parkway to Taconic State Parkway exit, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.

+

Upstate New York

+

Route I-84 east across Newburgh-Beacon Bridge to Exit 16-S. Taconic State Parkway south to Route 134 East exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.

+

New York City (Manhattan)

+

Henry Hudson Parkway north, which becomes Saw Mill River Parkway, north to Taconic State Parkway exit. North on Taconic State Parkway to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.

+

John F. Kennedy International Airport

+

North on Van Wyck Expressway to the Whitestone Expressway and continue north across the Bronx-Whitestone Bridge to the Hutchinson River Parkway north to the Cross County Parkway exit and proceed west to the Bronx River Parkway. North on the Bronx River Parkway to the Sprain Brook Parkway, which merges into the Taconic State Parkway. Continue north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.

+

LaGuardia Airport

+

East on the Grand Central Parkway, north on the Whitestone Expressway, and continue north across the Bronx-Whitestone Bridge. Continue with instructions from John F. Kennedy International Airport, above.

+

Newark International Airport

+

North on the New Jersey Turnpike (Route I-95). Stay in local lanes and take Exit 72 for Palisades Interstate Parkway. North on the Palisades Interstate Parkway to the New York State Thruway, Route I-87, and east across the Tappan Zee Bridge. Continue with instructions from New Jersey, above.

+

Stewart International Airport

+

Route 207 east to Route I-84, east across Newburgh-Beacon Bridge to Taconic State Parkway, south. Continue with instructions from Upstate New York, above.

+

Westchester County Airport

+

Right on Route 120, north. Turn left where Route 120 merges with Route 133. Continue on Route 120. Cross Route 100 and continue straight on Shingle House Road to Pines Bridge Road. Turn right and proceed several hundred yards. IBM is on the left.

+

Public Transportation

+

Metropolitan Transportation Authority (MTA) train stations nearest to the Yorktown Heights location are the Croton-Harmon and White Plains stations. Taxi service is available at both locations.

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/sixteenth-tuc-meeting/index.html b/event/sixteenth-tuc-meeting/index.html new file mode 100644 index 00000000..3e6d0f83 --- /dev/null +++ b/event/sixteenth-tuc-meeting/index.html @@ -0,0 +1,739 @@ + + + + + Sixteenth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Sixteenth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Oskar van Rest, Gábor Szárnyas / on 14 Feb 2023
+ + + +
+ Location: Seattle +
+
+ + Event dates: 23 Jun 2023 09:00 -- 24 Jun 2023 18:00 (local timezone) + +
+
+

Organizers: Oskar van Rest, Alastair Green, Gábor Szárnyas

+

LDBC is hosting a two-day hybrid workshop, co-located with SIGMOD 2023 on June 23-24 (Friday-Saturday).

+

The program consists of 10- and 15-minute talks followed by a Q&A session. The talks will be recorded and made available online. If you would like to participate, please register using our form.

+

LDBC will host a social event on Friday at the Black Bottle gastrotavern in Belltown: 2600 1st Ave (on the corner of Vine), Seattle, WA 98121.

+

In addition, AWS will host a Happy Hour (rooftop grill with beverages) on Saturday on the Amazon Nitro South building’s 8th floor deck: 2205 8th Ave, Seattle, WA 98121.

+

Program

+

All times are in PDT.

+

Friday

+

Location: Hyatt Regency Bellevue on Seattle’s Eastside, room Grand K, co-located with SIGMOD (900 Bellevue Way NE, Bellevue, WA 98004-4272)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
start | finish | speaker | title
08:30 | 08:45 | Oskar van Rest (Oracle) | LDBC – State of the union – slides, video
08:50 | 09:05 | Keith Hare (JCC / WG3) | An update on the GQL & SQL/PGQ standards efforts – slides, video
09:10 | 09:25 | Stefan Plantikow (Neo4j / WG3) | GQL - Introduction to a new query language standard – slides
09:30 | 09:45 | Leonid Libkin (University of Edinburgh & RelationalAI) | Formalizing GQL – slides, video
09:50 | 10:05 | Semen Panenkov (JetBrains Research) | Mechanizing the GQL semantics in Coq – slides, videos
10:10 | 10:25 | Oskar van Rest (Oracle) | SQL Property Graphs in Oracle Database and Oracle Graph Server (PGX) – slides, video
10:30 | 11:00 | coffee break |
11:00 | 11:15 | Alastair Green (JCC) | LDBC’s organizational changes and fair use policies – slides
11:20 | 11:35 | Ioana Manolescu (INRIA) | Integrating Connection Search in Graph Queries – slides, video
11:40 | 11:55 | Maciej Besta (ETH Zurich) | Neural Graph Databases with Graph Neural Networks – video
12:00 | 12:10 | Longbin Lai (Alibaba Damo Academy) | To Revisit Benchmarking Graph Analytics – slides, video
12:15 | 13:30 | lunch |
13:30 | 13:45 | Yuanyuan Tian (Gray Systems Lab, Microsoft) | The World of Graph Databases from An Industry Perspective – slides, video
13:50 | 14:05 | Alin Deutsch (UC San Diego & TigerGraph) | TigerGraph’s Parallel Computation Model – slides, video
14:10 | 14:25 | Chen Zhang (CreateLink) | Applications of a Native Distributed Graph Database in the Financial Industry – video
14:30 | 14:45 | Ricky Sun (Ultipa) | Design of highly scalable graph database systems – slides, video
14:50 | 15:30 | coffee break |
15:30 | 15:45 | Heng Lin (Ant Group) | The LDBC SNB implementation in TuGraph – slides, video
15:50 | 16:05 | Shipeng Qi (Ant Group) | FinBench: The new LDBC benchmark targeting financial scenario – slides, video
16:10 | 17:00 | host: Heng Lin (Ant Group), panelists: Longbin Lai (Alibaba Damo Academy), Ricky Sun (Ultipa), Gabor Szarnyas (CWI), Yuanyuan Tian (Gray Systems Lab, Microsoft) | FinBench panel – slides
19:00 | 22:00 | dinner | Black Bottle gastrotavern in Belltown: 2600 1st Ave (on the corner of Vine), Seattle, WA 98121
+

Saturday

+

Location: Amazon Nitro South building, room 03.204 (2205 8th Ave, Seattle, WA 98121)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
start | finish | speaker | title
09:00 | 09:45 | Brad Bebee (AWS) | Customers don’t want a graph database, so why are we still here? – slides, video
10:00 | 10:15 | Muhammad Attahir Jibril (TU Ilmenau) | Fast and Efficient Update Handling for Graph H2TAP – slides, video
10:20 | 11:00 | coffee break |
11:00 | 11:15 | Gabor Szarnyas (CWI) | LDBC Social Network Benchmark and Graphalytics – slides
11:20 | 11:30 | Atanas Kiryakov and Tomas Kovachev (Ontotext) | GraphDB – Benchmarking against LDBC SNB & SPB – slides, video
11:35 | 11:50 | Roi Lipman (Redis Labs) | Delta sparse matrices within RedisGraph – slides, video
11:55 | 12:05 | Rathijit Sen (Microsoft) | Microarchitectural Analysis of Graph BI Queries on RDBMS – slides, video
12:10 | 13:30 | lunch | on your own
13:30 | 13:45 | Alastair Green (JCC) | LEX – LDBC Extended GQL Schema – slides, video
13:50 | 14:05 | Ora Lassila (AWS) | Why limit yourself to {RDF, LPG} when you can do {RDF, LPG}, too – slides, video
14:10 | 14:25 | Jan Hidders (Birkbeck, University of London) | PG-Schema: a proposal for a schema language for property graphs – slides, video
14:30 | 14:45 | Max de Marzi (RageDB and RelationalAI) | RageDB: Building a Graph Database in Anger – slides, video
14:50 | 15:30 | coffee break |
15:30 | 15:45 | Umit Catalyurek (AWS) | HPC Graph Analytics on the OneGraph Model – slides, video
15:50 | 16:05 | David J. Haglin (Trovares) | How LDBC impacts Trovares – slides, video
16:10 | 16:25 | Wenyuan Yu (Alibaba Damo Academy) | GraphScope Flex: A Graph Computing Stack with LEGO-Like Modularity – slides, video
16:30 | 16:40 | Scott McMillan (Carnegie Mellon University) | Graph processing using GraphBLAS – slides, video
16:45 | 16:55 | Tim Mattson (Intel) | Graphs (GraphBLAS) and storage (TileDB) as Sparse Linear algebra – slides
17:00 | 20:00 | happy hour (rooftop grill with beverages) | on the Nitro South building’s 8th floor deck
+

TUC event locations

+

A map of the LDBC TUC events we have hosted so far.

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/sixth-tuc-meeting/index.html b/event/sixth-tuc-meeting/index.html new file mode 100644 index 00000000..5a4f8191 --- /dev/null +++ b/event/sixth-tuc-meeting/index.html @@ -0,0 +1,528 @@ + + + + + Sixth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Sixth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by / on 23 Apr 2015
+ + + +
+ Location: Barcelona, March +
+
+ + Event dates: 19 Mar 2015 13:53 -- 20 Mar 2015 13:53 (local timezone) + +
+
+

The LDBC consortium is pleased to announce its Sixth Technical User Community (TUC) meeting.

+

This will be a two-day event at Universitat Politècnica de Catalunya, Barcelona on Thursday and Friday March 19/20, 2015.

+

The LDBC FP7 EC-funded project is approaching its conclusion, and this will be the last event sponsored directly by the project. However, work within LDBC will continue under the independent LDBC organisation. The event will cover the following aspects:

+
    +
  • A two-day event, with one day devoted to users’ experiences and one day devoted to benchmarking experiences.
  • +
  • Presentation of the first benchmarking results for the different benchmarks.
  • +
  • Interaction with the new LDBC Board of Directors and the officials of the new LDBC organisation.
  • +
  • A pre-event: the 3rd Graph-TA workshop, organised on March 18th at the same premises, with plenty of interaction and interesting research presentations.
  • +
+

We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact damaris@ac.upc.edu.

+

Agenda

+

Thursday 19th March

+

11:00 - 11:30 Registration, coffee break and welcome (Josep Larriba Pey)

+

11:30 - 12:00 LDBC introduction and status update (Peter Boncz) – slides

+

12:00 - 13:30 Technology and benchmarking (chair: Peter Boncz)

+

12:00 Venelin Kotsev (Ontotext). Semantic Publishing Benchmark v2.0. – slides

+

12:30 Nina Saveta (FORTH). SPIMBENCH: A Scalable, Schema-Aware, Instance Matching Benchmark for the Semantic Publishing Domain

+

12:50 Tomer Sagi (HP). Titan DB on LDBC SNB Interactive

+

13:10 Claudio Martella (VUA): Giraph and Lighthouse

+

13:30 - 14:30 Lunch break

+

14:30 - 16:00 Applications and use of Graph Technologies (chair: Hassan Chafi)

+

14:30 Jerven Bolleman (Swiss Institute of Bioinformatics): 20 billion triples in production – slides

+

14:50 Mark Wilkinson (Universidad Politécnica de Madrid): Design principles for Linked-Data-native Semantic Web Services – slides

+

15:10 Peter Haase (Metaphacts, Systap LLC): Querying the Wikidata Knowledge Graph – slides

+

15:30 Esteban Sota (GNOSS): Human Interaction with Faceted Searching Systems for big or complex graphs

+

18:30 - 20:00 Cultural visit Barcelona city center. Meet at Plaça Catalunya.

+

20:00 Social dinner at Bastaix Restaurant.

+

Friday 20th March

+

9:30 - 11:00 Technology and Benchmarking (chair: Josep L. Larriba-Pey)

+

9:30 Yinglong Xia (IBM): Towards Temporal Graph Management and Analytics

+

9:50 Alexandru Iosup (TU Delft). Graphalytics: A big data benchmark for graph-processing platforms

+

10:10 John Snelson (MarkLogic): Introduction to MarkLogic

+

10:30 Arnau Prat (UPC-Sparsity Technologies) and Alex Averbuch (Neo): Social Network Benchmark, Interactive Workload

+

10:50 Moritz Kaufmann. The auditing experience

+

11:15 - 11:45 Coffee break

+

11:45 - 12:45 Applications and use of Graph Technologies (chair: Atanas Kiryakov)

+

11:45 Boris Motik (Oxford University): Parallel and Incremental Materialisation of RDF/Datalog in RDFox

+

12:05 Andreas Both (Unister): E-Commerce and Graph-driven Applications: Experiences and Optimizations while moving to Linked Data

+

12:25 Smrati Gupta (CA Technologies). Modaclouds Decision Support System in multicloud environments

+

12:45 Peter Boncz. Conclusions for the LDBC project and future perspectives – slides

+

13:30 - 14:30 Lunch break

+

15:00 LDBC Board of Directors

+

Logistics

+
Date
+

19th and 20th March 2015

+
Venue
+

The TUC meeting will be held in the “Aula Master” in the A3 building, located inside the “Campus Nord UPC” in Barcelona. The address is:

+

Aula Master
+Edifici A3, Campus Nord UPC
+C. Jordi Girona, 1-3
+08034 Barcelona, Spain

+
Maps and situation
+

To reach the campus, there are several options, including Taxi, Metro and Bus.

+

+
Finding UPC
+

+
Finding the meeting room
+
Getting there
+

Flying: Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is the train, located just a few minutes’ walk past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this map of the airport). It is possible to buy a 10-pack of train tickets, which makes the trip cheaper. Taking the bus to the centre of town is more convenient, as buses leave directly from terminals 1 and 2, but it is more expensive than the train.

+

Rail: The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to
+the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.

+

Bus: The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.

+

Taxi: From the airport, you can take one of Barcelona’s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €20 and trips to other destinations in the city cost approximately €25-30.

+

Train and bus: Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. You can find detailed information in the following link: http://www.barcelona-airport.com/eng/transport_eng.htm

+

+
The locations of the airport and the city centre
+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/tenth-tuc-meeting/index.html b/event/tenth-tuc-meeting/index.html new file mode 100644 index 00000000..34c09334 --- /dev/null +++ b/event/tenth-tuc-meeting/index.html @@ -0,0 +1,515 @@ + + + + + Tenth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Tenth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Peter Boncz / on 05 Nov 2017
+ + + +
+ Location: +
+
+ + Event date: 01 Sep 2017 10:30 (local timezone) + +
+
+

This will be a one-day event at the VLDB 2017 conference in Munich, Germany on September 1, 2017.

+

Topics and activities of interest in these TUC meetings are:

+
    +
  • Presentation on graph data management usage scenarios.
  • +
  • Presentation of the benchmarking results for the different benchmarks, as well as the graph query language task force.
  • +
  • Interaction with the new LDBC Board of Directors and the LDBC organisation officials.
  • +
+

We welcome all users of RDF and Graph technologies to attend. If you are interested in attending the event, please contact Adrian Diaz (UPC) at adiaz@ac.upc.edu to register; registration is free, but required.

+

The agenda will include talks by LDBC members on LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and in hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmarks or benchmark proposals are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz and Larri.

+

Further, if you or your colleagues have contacts at companies that deal with graph data management scenarios, we encourage you to invite them to attend and possibly present. LDBC is always looking to expand its circle of TUC meeting participants and graph technology user contacts, and eventually its membership base.

+

Agenda

+

In the TUC meeting there will be:

+
    +
  • updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.
  • +
  • talks by data management practitioners highlighting graph data management challenges
  • +
  • selected scientific talks on graph data management technology
  • +
+

The meeting will start on Friday morning, with a program running from 10:30 to 17:00.

+

10:30-12:00: TUC session (public)

+ +

12:00-13:30: lunch break

+

13:30-15:00: TUC session (public)

+ +

15:00-15:30: break

+

15:30-17:00: TUC session (public)

+ +

Speakers should aim for a 20-minute talk.

+

Further:

+
    +
  • on Friday evening (19:00-21:00) there will be a social dinner at Löwenbräukeller, sponsored and arranged by LDBC member Huawei (who have their European Research Center in Munich).
  • +
  • on Friday morning (8:30-10:30) there will be a meeting of the LDBC board of directors, but this meeting is not public.
  • +
+

Venue

+

The Technical University of Munich (TUM) is hosting the VLDB conference that week; on the day of the TUC meeting the main conference will have finished, but a number of co-located workshops will still be ongoing, and the TUC participants will blend in with that crowd for the breaks and lunch.

+

The TUC meeting will be held in Room 2607 alongside the VLDB workshops that day (MATES, ADMS, DMAH, DBPL and BOSS).

+

address: Technische Universität München (TUM), Arcisstraße 21, 80333 München

+

Google Maps

+


+

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/third-tuc-meeting/index.html b/event/third-tuc-meeting/index.html new file mode 100644 index 00000000..060f73ea --- /dev/null +++ b/event/third-tuc-meeting/index.html @@ -0,0 +1,603 @@ + + + + + Third TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Third TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Peter Boncz / on 04 Apr 2021
+ + + +
+ Location: London, United Kingdom +
+
+ + Event date: 19 Nov 2013 08:00 (local timezone) + +
+
+

The LDBC consortium is pleased to announce the third Technical User Community (TUC) meeting!

+

This will be a one-day event in London on 19 November 2013, running in collaboration with the GraphConnect event (18/19 November). Registered TUC participants who would like a free pass to all of GraphConnect should register for GraphConnect using the following coupon code: LDBCTUC.

+

The TUC event will include:

+
    +
  • Introduction to the objectives and progress of the LDBC project
  • +
  • Description of the progress of the benchmarks being evolved through Task Forces
  • +
  • Users explaining their use-cases and describing the limitations they have found in current technology
  • +
  • Industry discussions on the contents of the benchmarks
  • +
+

We will also be launching the LDBC non-profit organization, so anyone outside the EU project will be able to join as a member.

+

We will kick off new benchmark development task forces in the coming year, and talks at this coming TUC will play an important role in deciding the use case scenarios that will drive those benchmarks.

+

All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu

+ +

Agenda

+

November 19th - Public TUC Meeting

+

8:00 Breakfast and registration for GraphConnect/TUC open (Dexter House)

+

short LDBC presentation (Peter Boncz) during GraphConnect keynote by Emil Eifrem (09:00-09:30 Dexter House)

+

NOTE: the TUC meeting is at the Tower Hotel, near Dexter House.

+

10:00 TUC Meeting Opening (Peter Boncz)

+

10:10 TUC Presentations (RDF Application Descriptions)

+ +

11:30 Semantic Publishing Benchmark (SPB)

+ +

12:00-13:00 Lunch at the Graph Connect venue

+

Talks During Lunch:

+ +

13:00 TUC Presentations (Graph Application Descriptions)

+ +

14:00 Social Network Benchmark (SNB)

+ +

14:30 Break

+

14:45 TUC Presentations (Graph Analytics)

+
    +
  • Keith Houck (IBM): Benchmarking experiences with [System G Native Store (tentative title)]
  • +
  • Abraham Bernstein (University of Zurich): Streams and Advanced Processing: Benchmarking RDF querying beyond the Standard SPARQL Triple Store
  • +
  • Luis Ceze (University of Washington): Grappa and GraphBench Status Update
  • +
+

15:45 Break

+

16:00 TUC Presentations (Possible Future RDF Benchmarking Topics)

+ +

17:20 Meeting Conclusion (Josep Larriba Pey)

+

17:30 End of TUC meeting

+

19:00 Social dinner

+

November 20th - Internal LDBC Meeting

+

10:00 Start

+

12:30 End of meeting

+
    +
  • coffee and lunch provided
  • +
+

Logistics

+

Date

+

19th November 2013

+

Location

+

The TUC meeting will be held at The Tower Hotel (Google Maps link), approximately a 4-minute walk from the GraphConnect conference in London.

+

Getting there

+
    +
  • From City Airport (the easiest option): a short ride on the DLR to Tower Gateway.
  • +
  • From London Heathrow: first take the Heathrow Express to Paddington, then take the Circle line to Tower Hill. See attached.
  • +
+

LDBC/TUC Background

+

Looking back, we have been working on two benchmarks for the past year: a Social Network Benchmark (SNB) and a Semantic Publishing Benchmark (SPB). While below we provide a short summary, all the details of the work on these benchmark development efforts can be found in the first yearly progress reports:

+ +

A summary of these efforts can be read below or, for a more detailed account, please refer to: The Linked Data Benchmark Council: a Graph and RDF industry benchmarking effort. Annual reports about the progress, results, and future work of these two efforts will soon be available for download here, and will be discussed in depth at the TUC.

+

Social Network Benchmark

+

The Social Network Benchmark (SNB) is designed for evaluating a broad range of technologies for tackling graph data management workloads. The systems targeted are quite broad: from graph, RDF, and relational database systems to Pregel-like graph compute frameworks. The social network scenario was chosen with the following goals in mind:

+
    +
  • it should be understandable, and the relevance of managing such data should be clear
  • +
  • it should cover the complete range of interesting challenges, according to the benchmark scope
  • +
  • the queries should be realistic, i.e., similar data and workloads are encountered in practice
  • +
+

SNB includes a data generator for creation of synthetic social network data with the following characteristics:

+
    +
  • data schema is representative of real social networks
  • +
  • data generated includes properties occurring in real data, e.g. irregular structure, structure/value correlations, power-law distributions (see the short sketch after this list)
  • +
  • the software generator is easy-to-use, configurable and scalable
  • +
+
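To make the power-law point above concrete, here is a minimal, hypothetical sketch (not part of Datagen itself) of how a generator can draw node degrees from a heavy-tailed distribution, so that a few persons have very many friends while most have few. The exponent, cap, and seed below are illustrative assumptions only.

```python
import random

# Illustration only: draw "friend counts" from a power-law (Pareto)
# distribution, the kind of skew SNB Datagen aims to reproduce.
# alpha (tail exponent) and the cap of 5000 are illustrative assumptions.
random.seed(42)  # a fixed seed gives determinism, one of Datagen's stated goals

def sample_degree(alpha: float = 2.0, max_degree: int = 5000) -> int:
    # paretovariate(alpha) returns values >= 1 with a heavy tail
    return min(int(random.paretovariate(alpha)), max_degree)

degrees = [sample_degree() for _ in range(100_000)]
print("median degree:", sorted(degrees)[len(degrees) // 2])
print("max degree:   ", max(degrees))  # a few hubs dominate
```

The actual Datagen additionally correlates structure with attribute values (e.g. people from the same country or with the same interests are more likely to be connected), which a simple independent sampler like this does not capture.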

SNB is intended to cover a broad range of aspects of social network data management, and therefore includes three distinct workloads:

+
    +
  • Interactive +
      +
    • Tests system throughput with relatively simple queries and concurrent updates; it is designed to test ACID features and scalability in an online operational setting (see the sketch after this list).
    • +
    • The targeted systems are expected to be those that offer transactional functionality.
    • +
    +
  • +
  • Business Intelligence +
      +
    • Consists of complex structured queries for analyzing the online behavior of users for marketing purposes; it is designed to stress query execution and optimization.
    • +
    • The targeted systems are expected to be those that offer an abstract query language.
    • +
    +
  • +
  • Graph Analytics +
      +
    • Tests the functionality and scalability of systems for graph analytics, which typically cannot be expressed in a query language.
    • +
    • Analytics is performed on most/all of the data in the graph as a single operation and produces large intermediate results, and it is not expected to be transactional or need isolation.
    • +
    • The targeted systems are graph compute frameworks, though database systems may compete, for example by using iterative implementations that repeatedly execute queries and keep intermediate results in temporary data structures.
    • +
    +
  • +
+
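As a rough illustration of what the Interactive workload exercises, the sketch below interleaves short neighbourhood reads with concurrent small updates against a toy in-memory stand-in and reports throughput. This is not the LDBC driver or any real database API; every name, the operation mix, and the thread count are assumptions made up for illustration.

```python
import threading, time, random
from collections import defaultdict

# Toy stand-in for a transactional graph store; the real Interactive workload
# runs against an actual DBMS through the LDBC SNB driver.
friends = defaultdict(set)
lock = threading.Lock()
ops = 0

def worker(n_ops: int) -> None:
    global ops
    for _ in range(n_ops):
        a, b = random.randrange(10_000), random.randrange(10_000)
        if random.random() < 0.1:      # assumed ~10% short update transactions
            with lock:
                friends[a].add(b)
        else:                          # assumed ~90% simple 1-hop reads
            with lock:
                _ = len(friends[a])
        with lock:
            ops += 1

start = time.time()
threads = [threading.Thread(target=worker, args=(50_000,)) for _ in range(4)]
for t in threads:
    t.start()
for t in threads:
    t.join()
print(f"throughput: {ops / (time.time() - start):,.0f} ops/s")
```

A real run measures throughput under latency constraints and validates transactional (ACID) behaviour, which this toy loop does not attempt.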

Semantic Publishing Benchmark

+

The Semantic Publishing Benchmark (SPB) simulates the management and consumption of RDF metadata that describes media assets, or creative works.

+

The scenario is a media organization that maintains RDF descriptions of its catalogue of creative works – input was provided by actual media organizations which make heavy use of RDF, including the BBC. The benchmark is designed to reflect a scenario where a large number of aggregation agents provide the heavy query workload, while at the same time a steady stream of creative work description management operations is in progress. This benchmark only targets RDF databases that support at least basic forms of semantic inference. A tagging ontology is used to connect individual creative work descriptions to instances from reference datasets, e.g. sports, geographical, or political information. The data used falls under the following categories: reference data, which is a combination of several Linked Open Data datasets, e.g. GeoNames and DBpedia; domain ontologies, which are specialist ontologies used to describe certain areas of expertise of the publisher, e.g., sport and education; publication asset ontologies, which describe the structure and form of the assets that are published, e.g., news stories, photos, video, audio, etc.; and tagging ontologies and metadata, which link assets with reference/domain ontologies.

+

The data generator is initialized by using several ontologies and datasets. The instance data collected from these datasets are then used at several points during the execution of the benchmark. Data generation is performed by generating SPARQL fragments for create operations on creative works and executing them against the RDF database system.
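A minimal sketch of the kind of create operation described above, assuming a SPARQL 1.1 Update endpoint at a made-up URL and a deliberately simplified creative-work shape; the prefix, properties, and endpoint path are illustrative assumptions, not the actual SPB ontologies or configuration.

```python
import requests  # assumes the 'requests' package is installed

# Illustrative SPARQL 1.1 Update fragment inserting one creative work;
# the vocabulary below is simplified and is not the real SPB schema.
update = """
PREFIX ex: <http://example.org/creative-work/>
INSERT DATA {
  ex:cw-12345 a ex:CreativeWork ;
              ex:title "Example news story" ;
              ex:tag   ex:topic-sports .
}
"""

# Hypothetical endpoint URL; SPB executes generated fragments like this
# against the RDF store under test during data generation and the
# Editorial workload.
resp = requests.post(
    "http://localhost:7200/repositories/spb/statements",  # assumed URL
    data=update,
    headers={"Content-Type": "application/sparql-update"},
)
resp.raise_for_status()
```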

+

Two separate workloads are modeled in SPB:

+
    +
  • Editorial: Simulates creating, updating and deleting creative work metadata descriptions. Media companies use both manual and semi-automated processes for efficiently and correctly managing asset descriptions, as well as annotating them with relevant instances from reference ontologies.
  • +
  • Aggregation: Simulates the dynamic aggregation of content for consumption by the distribution pipelines (e.g. a web-site). The publishing activity is described as “dynamic”, because the content is not manually selected and arranged on, say, a web page. Instead, templates for pages are defined and the content is selected when a consumer accesses the page.
  • +
+

Status of the Semantic Publishing Benchmark

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/thirteenth-tuc-meeting/index.html b/event/thirteenth-tuc-meeting/index.html new file mode 100644 index 00000000..b72fba04 --- /dev/null +++ b/event/thirteenth-tuc-meeting/index.html @@ -0,0 +1,485 @@ + + + + + Thirteenth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Thirteenth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by Peter Boncz / on 26 Jun 2020
+ + + +
+ Location: Online (Zoom) +
+
+ + Event dates: 30 Jun 2020 14:00 -- 01 Jul 2020 17:00 (local timezone) + +
+
+

LDBC is pleased to announce its Thirteenth Technical User Community (TUC) meeting.

+

LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) give feedback on these, (3) hear about user experiences with graph data management technologies, and (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.

+

This TUC meeting will be a two-day event hosted online. We welcome all users of RDF and Graph technologies to attend. If you are interested in attending the event, please contact Gabor Szarnyas (BME) to register.

+

SNB Task Force

+
    +
  • Progress report +
      +
    • ACID compliance test suite
    • +
    • Integrating deletions to Datagen
    • +
    • Migrating Datagen to Spark
    • +
    • Redesign of BI read queries
    • +
    • Extensions to the driver
    • +
    +
  • +
  • Ongoing work +
      +
    • Datagen: tuning the distribution of deletes
    • +
    • Interactive 2.0 workload
    • +
    • BI 1.0 workload
    • +
    +
  • +
+

Zoom links will be sent through email.

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/event/twelfth-tuc-meeting/index.html b/event/twelfth-tuc-meeting/index.html new file mode 100644 index 00000000..15ce55a0 --- /dev/null +++ b/event/twelfth-tuc-meeting/index.html @@ -0,0 +1,536 @@ + + + + + Twelfth TUC Meeting + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Twelfth TUC Meeting

+ + + + +
+
+
+
+ + + + +
+
+
+
+ + +
by / on 11 Jul 2019
+ + + +
+ Location: Amsterdam, the Netherlands +
+
+ + Event date: 05 Jul 2019 08:30 (local timezone) + +
+
+

LDBC is pleased to announce its Twelfth Technical User Community (TUC) meeting.

+

LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) give feedback on these, (3) hear about user experiences with graph data management technologies, and (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.

+

This TUC meeting will be a one-day event on the last Friday of SIGMOD/PODS 2019 in Amsterdam, The Netherlands, in the conference venue of Beurs van Berlage. The room is the Mendes da Silva kamer. Please check the SIGMOD/PODS website for tips on accommodation in Amsterdam.

+

Note also that at SIGMOD/PODS in Amsterdam on Sunday, June 30, there is a research workshop on graph data management technology called GRADES-NDA 2019, which may be of interest to our audience (this generally holds for the whole SIGMOD/PODS program, of course).

+

We welcome all users of RDF and Graph technologies to attend. If you are interested in attending the event, please contact Damaris Coll (UPC) at damaris@ac.upc.edu to register.

+

=> registration is free, but required <=

+

You need to be registered in order to get into the SIGMOD/PODS venue. Friday, July 5, is the final (workshop) day of SIGMOD/PODS, and the LDBC TUC meeting joins the other workshops for coffee and lunch.

+

The agenda will include talks by LDBC members on LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and in hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmarks or benchmark proposals are very relevant. But nothing is excluded a priori if it is related to graph data management.

+

Talk proposals can be sent to Peter Boncz, who is also the local organizer. Please also send your slides to this email for archiving on this site.

+

Further, if you or your colleagues have contacts at companies that deal with graph data management scenarios, we encourage you to invite them to attend and possibly present. LDBC is always looking to expand its circle of TUC meeting participants and graph technology user contacts, and eventually its membership base.

+

Agenda

+

In the TUC meeting, there will be:

+
    +
  • updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.
  • +
  • talks by data management practitioners highlighting graph data management challenges and products
  • +
+

The morning slot (08:30-10:30) is reserved for an LDBC Board Meeting, to which in principle only LDBC directors are invited (that meeting will be held in the same room).

+

The TUC meeting will start on Friday morning after the morning coffee break of SIGMOD/PODS 2019 (room: Mendes da Silva kamer):

+

08:30-10:30 LDBC Board Meeting (non-public)

+

10:30-11:00 Coffee

+

11:00-12:45 Session 1: Graph Benchmarks

+ +

12:45-14:00 Lunch

+

14:00-16:05 Session 2: Graph Query Languages

+ +

16:05-16:30 Coffee

+

16:30-17:50 Session 3: Graph System Performance

+ +

If there is interest, we will organize a social dinner on Friday evening for LDBC attendees.

+ +
+ +
+
Tags:
+ +
+ + +
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/events/index.html b/events/index.html new file mode 100644 index 00000000..7803d855 --- /dev/null +++ b/events/index.html @@ -0,0 +1,10 @@ + + + + /event + + + + + + diff --git a/gql-community/elwg/index.html b/gql-community/elwg/index.html new file mode 100644 index 00000000..6bc06c8f --- /dev/null +++ b/gql-community/elwg/index.html @@ -0,0 +1,387 @@ + + + + + Existing Languages Working Group (ELWG) + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Existing Languages Working Group (ELWG)

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+
    +
  • Group leader: Petra Selmer (Neo4j)
  • +
  • Focus: Surveying existing graph query languages
  • +
+

Group members

+
    +
  • Angela Bonifati (Lyon 1 University)
  • +
  • Frank Celler (ArangoDB)
  • +
  • Victor Lee (TigerGraph)
  • +
  • Harsh Thakkar (Consultant, OSTHUS GmbH)
  • +
  • Jeffrey Lovitz (RedisGraph)
  • +
  • Renzo Angles (Universidad de Talca)
  • +
+ +
+
+ +
+
+
+
+
+
+
+
+

Latest Working Group Updates

+
+
+

+ + +
+
+ +

Launching open-source language tools for ISO/IEC GQL

+
+ 09 May 2024 +

Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and …

+
+ + +
+ +
+
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/fswg/index.html b/gql-community/fswg/index.html new file mode 100644 index 00000000..48985e2c --- /dev/null +++ b/gql-community/fswg/index.html @@ -0,0 +1,378 @@ + + + + + Formal Semantics Working Group (FSWG) + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Formal Semantics Working Group (FSWG)

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+
    +
  • Group leaders: Leonid Libkin (ENS Paris, University of Edinburgh), Paolo Guagliardo (University of Edinburgh)
  • +
  • Focus: Establishing formal semantics for the upcoming GQL language
  • +
+ +
+
+ +
+
+
+
+
+
+
+
+

Latest Working Group Updates

+
+
+

+ + +
+
+ +

Launching open-source language tools for ISO/IEC GQL

+
+ 09 May 2024 +

Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and …

+
+ + +
+ +
+
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/index.html b/gql-community/index.html new file mode 100644 index 00000000..72cec386 --- /dev/null +++ b/gql-community/index.html @@ -0,0 +1,777 @@ + + + + + Gql communities + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Gql-communities

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Posts

+
Tags:
+ +
+
+ + + +
+
+ +
+ + +
+
+
+ +

Record-Breaking SNB Interactive Results for GraphScope

+
Tags:
+ BENCHMARK + , SNB + +
+
+ +

We are happy to announce new audited results for the SNB Interactive workload, achieved by the open-source GraphScope Flex system.

+

The current audit of the system has broken several records:

+
    +
  • It achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s.
  • +
  • It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s.
  • +
  • It is the first system to successfully complete the benchmark on …
+ +
+
+ +
+ + +
+
+ +
+ +

Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and tests for the GQL language. See this announcement from Alastair Green, Vice-chair of LDBC.

+

These tools are the work of the LDBC GQL Implementation Working Group, headed up by Michael Burbidge. Damian Wileński and Dominik Tomaszuk have worked …

+ +
+
+ +
+ + +
+
+ +
+ +

We are delighted to announce the official release of the initial version (v0.1.0) of Financial Benchmark (FinBench).

+

The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the LDBC FinBench Task Force. The benchmark currently has one workload, the Transaction Workload, capturing an OLTP scenario with complex read queries that access the …

+ +
+
+ +
+ + +
+
+
+ +

LDBC SNB – Early 2023 updates

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

2023 has been an eventful year for us so far. Here is a summary of our recent activities.

+
    +
  1. +

    Our paper The LDBC Social Network Benchmark: Business Intelligence Workload was published in PVLDB.

    +
  2. +
  3. +

    David Püroja just completed his MSc thesis on creating a design towards SNB Interactive v2 at CWI’s Database Architectures group. David and I gave a deep-dive talk at the FOSDEM conference’s graph developer room titled The LDBC Social Network …

+ +
+
+ +
+ + +
+
+
+ +

LDBC SNB Datagen – The winding path to SF100K

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

LDBC SNB provides a data generator, which produces synthetic datasets, mimicking a social network’s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism and usability. More than two years have elapsed since my last technical update on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/index.xml b/gql-community/index.xml new file mode 100644 index 00000000..6a5790a5 --- /dev/null +++ b/gql-community/index.xml @@ -0,0 +1,5467 @@ + + + + Gql-communities on Linked Data Benchmark Council + https://ldbcouncil.org/gql-community/ + Recent content in Gql-communities on Linked Data Benchmark Council + Hugo -- gohugo.io + en-us + &copy; Copyright LDBC 2024 + + Eighteenth TUC Meeting + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + Fri, 30 Aug 2024 09:00:00 -0800 + + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Shipeng Qi (AntGroup), Wenyuan Yu (Alibaba Demo), Yan Zhou (CreateLink)</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located in <strong>Guangzhou</strong> with <a href="https://vldb.org/2024/">VLDB 2024</a> on <strong>August 30-31 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. <strong>If you would like to participate please register using <a href="https://forms.gle/aVPrrcxXpSwrWPnh6">our form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="august-30-friday">August 30, Friday</h4> +<p><strong>Location:</strong> <a href="https://www.langhamhotels.com/en/the-langham/guangzhou/">Langham Place</a>, Guangzhou, <strong>room 1</strong>,<br> +co-located with VLDB (N0.630-638 Xingang Dong Road, Haizhu District, Guangzhou, China). See the map <a href="https://maps.app.goo.gl/86jD3Dy9Aa7bwLs36">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="august-31-saturday">August 31, Saturday</h4> +<p><strong>Location:</strong> Alibaba Center, Guangzhou (N0.88 Dingxin Road, Haizhu District, Guangzhou, China), near to VLDB Langham Place. See the map <a href="https://maps.app.goo.gl/HgEVafZMRmrzUsgW8">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + Seventeenth TUC Meeting + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + Sun, 09 Jun 2024 09:00:00 -0400 + + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + <p><strong>Organizers:</strong> Renzo Angles, Sebastián Ferrada</p> +<p>LDBC is hosting a one-day in-person workshop, co-located in <strong>Santiago de Chile</strong> with <a href="https://2024.sigmod.org/venue.shtml">SIGMOD 2024</a> on <strong>June 9 (Sunday)</strong>.</p> +<p>The workshop will be held in the <strong>Hotel Plaza El Bosque Ebro</strong> (<a href="https://www.plazaelbosque.cl">https://www.plazaelbosque.cl</a>), which is two blocks away from SIGMOD&rsquo;s venue. 
See the map <a href="https://maps.app.goo.gl/78oiw3zo2pH3gy5R6">here</a>.</p> +<p><strong>If you would like to participate please register using <a href="https://forms.gle/XXgaQfwBZAMMZJb78">this form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in Chile time (GMT-4).</strong></p> +<p><strong>Each speaker will have 20 minutes for exposition plus 5 minutes for questions.</strong></p> +<table> +<thead> +<tr> +<th>Time</th> +<th>Speaker</th> +<th>Title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>Welcome</td> +<td>&ldquo;Canelo&rdquo; saloon</td> +</tr> +<tr> +<td>09:30</td> +<td>Alastair Green (LDBC Vice-chair)</td> +<td>Status of the LDBC Extended GQL Schema Working Group</td> +</tr> +<tr> +<td>10:00</td> +<td>Hannes Voigt (Neo4j)</td> +<td>Inside the Standardization Machine Room: How ISO/IEC 39075:2024 – GQL was produced</td> +</tr> +<tr> +<td>10:30</td> +<td>Calin Iorgulescu (Oracle)</td> +<td>PGX.D: Distributed graph processing engine</td> +</tr> +<tr> +<td>11:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>11:30</td> +<td>Ricky Sun (Ultipa, Inc.)</td> +<td>A Unified Graph Framework with SCC (Storage-Compute Coupled) and HDC (High-Density Computing) Clustering</td> +</tr> +<tr> +<td>12:00</td> +<td>Daan de Graaf (TU Eindhoven)</td> +<td>Algorithm Support in a Graph Database, Done Right</td> +</tr> +<tr> +<td>12:30</td> +<td>Angela Bonifati (Lyon 1 University and IUF, France)</td> +<td>Transforming Property Graphs</td> +</tr> +<tr> +<td>13:00</td> +<td>Brunch</td> +<td></td> +</tr> +<tr> +<td>14:00</td> +<td>Juan Sequeda (data.world)</td> +<td>A Benchmark to Understand the Role of Knowledge Graphs on Large Language Model&rsquo;s Accuracy for Question Answering on Enterprise SQL Databases</td> +</tr> +<tr> +<td>14:30</td> +<td>Olaf Hartig (Linköping University)</td> +<td>FedShop: A Benchmark for Testing the Scalability of SPARQL Federation Engines</td> +</tr> +<tr> +<td>15:00</td> +<td>Olaf Hartig (Amazon)</td> +<td>Datatypes for Lists and Maps in RDF Literals</td> +</tr> +<tr> +<td>15:30</td> +<td>Peter Boncz (CWI and MotherDuck)</td> +<td>The state of DuckPGQ</td> +</tr> +<tr> +<td>16:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>16:30</td> +<td>Juan Reutter (IMFD and PUC Chile)</td> +<td>MillenniumDB: A Persistent, Open-Source, Graph Database</td> +</tr> +<tr> +<td>17:00</td> +<td>Carlos Rojas (IMFD)</td> +<td>WDBench: A Wikidata Graph Query Benchmark</td> +</tr> +<tr> +<td>17:30</td> +<td>Sebastián Ferrada (IMFD and Univ. 
de Chile)</td> +<td>An algebra for evaluating path queries</td> +</tr> +<tr> +<td>19:30</td> +<td>Dinner</td> +<td></td> +</tr> +</tbody> +</table> + + + + + Record-Breaking SNB Interactive Results for GraphScope + https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/ + Sun, 26 May 2024 00:00:00 +0000 + + https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/ + <p>We are happy to annonunce new <a href="https://ldbcouncil.org/benchmarks/snb-interactive/">audited results for the SNB Interactive workload</a>, achieved by the open-source <a href="https://github.com/alibaba/GraphScope">GraphScope Flex</a> system.</p> +<p>The current audit of the system has broken several records:</p> +<ul> +<li>It achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s.</li> +<li>It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s.</li> +<li>It is the first system to successfully complete the benchmark on scale factor 1000. It achieved a throughput of 127.8k ops/s</li> +</ul> +<p>The audit was commissioned by the <a href="https://www.alibabacloud.com/">Alibaba Cloud</a> and was conducted by <a href="https://www.linkedin.com/in/arnau-prat-a70283bb/">Dr. Arnau Prat-Pérez</a>, one of the original authors of the SNB Interactive benchmark. The queries were implemented as C++ stored procedures and the benchmark was executed on the Alibaba Cloud&rsquo;s infrastructure. The <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf">executive summary</a>, <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf">full disclosure report</a>, and <a href="%5B/benchmarks/snb/%5D(https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-attachments.tar.gz)">supplementary package</a> describe the benchmark&rsquo;s steps and include instructions for reproduction.</p> +<p>LDBC would like to congratulate the GraphScope Flex team on their record-breaking results.</p> +<div align="center"><img src="https://ldbcouncil.org/images/graphscope.svg" width="200"></div> + + + + + Launching open-source language tools for ISO/IEC GQL + https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/ + Thu, 09 May 2024 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/ + <p>Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and tests for the GQL language. See this <a href="https://ldbcouncil.org/pages/opengql-announce">announcement from Alastair Green, Vice-chair of LDBC</a>.</p> +<p>These tools are the work of the <strong>LDBC GQL Implementation Working Group</strong>, headed up by Michael Burbidge. 
Damian Wileński and Dominik Tomaszuk have worked with Michael to create these artefacts based on his ANTLR grammar for GQL.</p> + + + + + Announcing the Official Release of LDBC Financial Benchmark v0.1.0 + https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/ + Tue, 27 Jun 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/ + <p>We are delighted to announce the official release of the initial version (v0.1.0) of <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench)</a>.</p> +<p>The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">LDBC FinBench Task Force</a>. The benchmark has one workload currently, <strong>Transaction Workload</strong>, capturing OLTP scenario with complex read queries that access the neighbourhood of a given node in the graph and write queries that continuously insert or delete data in the graph.</p> +<p>Compared to LDBC SNB, the FinBench differs in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. For a brief overview, see the <a href="https://ldbcouncil.org/benchmarks/finbench/finbench-talk-16th-tuc.pdf">slides</a> in the 16th TUC. The <a href="https://arxiv.org/pdf/2306.15975.pdf">Financial Benchmark&rsquo;s specification</a> can be found on arXiv.</p> +<p>The release of FinBench initial version (v0.1.0) was approved by LDBC on June 23, 2023. It is the good beginning of FinBench. In the future, the FinBench Task Force will polish the benchmark continuously.</p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or qishipeng.qsp at antgroup.com.</p> + + + + + Sixteenth TUC Meeting + https://ldbcouncil.org/event/sixteenth-tuc-meeting/ + Fri, 23 Jun 2023 09:00:00 -0800 + + https://ldbcouncil.org/event/sixteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Oskar van Rest, Alastair Green, Gábor Szárnyas</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2023.sigmod.org/venue.shtml">SIGMOD 2023</a> on <strong>June 23-24 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. 
<strong>If you would like to participate please register using <a href="https://forms.gle/T6bwVHzK9V5FaKyR9">our form</a>.</strong></p> +<p>LDBC will host a <strong>social event</strong> on Friday at the <a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a>.</p> +<p>In addition, AWS will host a <strong>Happy Hour</strong> (rooftop grill with beverages) on Saturday on the Amazon Nitro South building&rsquo;s 8th floor deck: <a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>.</p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="friday">Friday</h4> +<p><strong>Location:</strong> Hyatt Regency Bellevue on Seattle&rsquo;s Eastside, <strong>room Grand K</strong>, co-located with SIGMOD (<a href="https://www.hyatt.com/en-US/hotel/washington/hyatt-regency-bellevue-on-seattles-eastside/belle">900 Bellevue Way NE, Bellevue, WA 98004-4272</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>08:30</td> +<td>08:45</td> +<td>Oskar van Rest (Oracle)</td> +<td>LDBC – State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-ldbc-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/Frk7ITssaSY">video</a></td> +</tr> +<tr> +<td>08:50</td> +<td>09:05</td> +<td>Keith Hare (JCC / WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/keith-hare-an-update-on-the-gql-and-sql-pgq-standards-efforts.pdf">slides</a>, <a href="https://youtu.be/LQYkal_0j6E">video</a></td> +</tr> +<tr> +<td>09:10</td> +<td>09:25</td> +<td>Stefan Plantikow (Neo4j / WG3)</td> +<td>GQL - Introduction to a new query language standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/stefan-plantikow-gql-v1.pdf">slides</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Leonid Libkin (University of Edinburgh &amp; RelationalAI)</td> +<td>Formalizing GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/leonid-libkin-formalizing-gql.pdf">slides</a>, <a href="https://youtu.be/YZE1a00h1I4">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Semen Panenkov (JetBrains Research)</td> +<td>Mechanizing the GQL semantics in Coq – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/semyon-panenkov-gql-in-coq.pdf">slides</a>, <a href="https://youtu.be/5xBGohqWCzo">videos</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Oskar van Rest (Oracle)</td> +<td>SQL Property Graphs in Oracle Database and Oracle Graph Server (PGX) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-sql-property-graphs-in-oracle-database-and-oracle-graph-server-pgx.pdf">slides</a>, <a href="https://youtu.be/owM9WiQubpg">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (JCC)</td> +<td>LDBC&rsquo;s organizational changes and fair use policies – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-ldbc-corporate-restructuring-and-fair-use-policies.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>Ioana Manolescu (INRIA)</td> +<td>Integrating Connection Search in Graph Queries – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ioana-manolescu-integrating-connection-search-in-graph-queries.pdf">slides</a>, <a href="https://youtu.be/LQPnmcrkUpY">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Maciej Besta (ETH Zurich)</td> +<td>Neural Graph Databases with Graph Neural Networks – <a href="https://youtu.be/ce5qNievRNs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:10</td> +<td>Longbin Lai (Alibaba Damo Academy)</td> +<td>To Revisit Benchmarking Graph Analytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/longbin-lai-benchmark-ldbc.pdf">slides</a>, <a href="https://youtu.be/s9Vtt-6t_FI">video</a></td> +</tr> +<tr> +<td>12:15</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>The World of Graph Databases from An Industry Perspective – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/yuanyuan-tian-world-of-graph-databases.pdf">slides</a>, <a href="https://youtu.be/AZuP_b95GPM">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Alin Deutsch (UC San Diego &amp; TigerGraph)</td> +<td>TigerGraph&rsquo;s Parallel Computation Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alin-deutsch-tigergraphs-computation-model.pdf">slides</a>, <a href="https://youtu.be/vcxdieJB80Y">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Chen Zhang (CreateLink)</td> +<td>Applications of a Native Distributed Graph Database in the Financial Industry – <a href="https://youtu.be/GCCT79Sps9I">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Ricky Sun (Ultipa)</td> +<td>Design of highly scalable graph database systems – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ricky-sun-ultipa.pdf">slides</a>, <a href="https://youtu.be/Sg1F64O4vGM">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Heng Lin (Ant Group)</td> +<td>The LDBC SNB implementation in TuGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-the-ldbc-snb-implementation-in-tugraph.pdf">slides</a>, <a href="https://youtu.be/fy8AuVerwnY">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>Shipeng Qi (Ant Group)</td> +<td>FinBench: The new LDBC benchmark targeting financial scenario – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/shipeng-qi-finbench.pdf">slides</a>, <a href="https://youtu.be/0xLZadDOfZk">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>17:00</td> +<td>host: Heng Lin (Ant Group), panelists: Longbin Lai (Alibaba Damo Academy), Ricky Sun (Ultipa), Gabor Szarnyas (CWI), Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>FinBench panel – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-finbench-panel.pdf">slides</a></td> +</tr> +<tr> +<td>19:00</td> +<td>22:00</td> +<td><em>dinner</em></td> +<td><em><a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a></em></td> +</tr> +</tbody> +</table> +<h4 id="saturday">Saturday</h4> +<p><strong>Location:</strong> Amazon Nitro South building, <strong>room 03.204</strong> (<a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>09:45</td> +<td>Brad Bebee (AWS)</td> +<td>Customers don&rsquo;t want a graph database, so why are we still here? – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/brad-bebee-tuc-keynote.pdf">slides</a>, <a href="https://youtu.be/bJlkpDC--fM">video</a></td> +</tr> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Fast and Efficient Update Handling for Graph H2TAP – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/muhammad-attahir-jibril-fast-and-efficient-update-handling-for-graph-h2tap.pdf">slides</a>, <a href="https://youtu.be/e8ZAszBsXV0">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Gabor Szarnyas (CWI)</td> +<td>LDBC Social Network Benchmark and Graphalytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-social-network-benchmark-and-graphalytics.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:30</td> +<td>Atanas Kiryakov and Tomas Kovachev (Ontotext)</td> +<td>GraphDB – Benchmarking against LDBC SNB &amp; SPB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tomas-kovatchev-atanas-kiryakov-benchmarking-graphdb-with-snb-and-spb.pdf">slides</a>, <a href="https://youtu.be/U6OPpNFOWqg">video</a></td> +</tr> +<tr> +<td>11:35</td> +<td>11:50</td> +<td>Roi Lipman (Redis Labs)</td> +<td>Delta sparse matrices within RedisGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/roi-lipman-delta-matrix.pdf">slides</a>, <a href="https://youtu.be/qfKsplV4Ihk">video</a></td> +</tr> +<tr> +<td>11:55</td> +<td>12:05</td> +<td>Rathijit Sen (Microsoft)</td> +<td>Microarchitectural Analysis of Graph BI Queries on RDBMS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/rathijit-sen-microarchitectural-analysis.pdf">slides</a>, <a href="https://youtu.be/55B8CkH09js">video</a></td> +</tr> +<tr> +<td>12:10</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td><em>on your own</em></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Alastair Green (JCC)</td> +<td>LEX &ndash; LDBC Extended GQL Schema – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-lex.pdf">slides</a>, <a href="https://youtu.be/DVpeb4Ce9Uw">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Ora Lassila (AWS)</td> +<td>Why limit yourself to {RDF, LPG} when you can do {RDF, LPG}, 
too – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ora-lassila-why-limit-yourself-to-lpg-when-you-can-do-rdf-too.pdf">slides</a>, <a href="https://youtu.be/7uAInoUwdds">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Jan Hidders (Birkbeck, University of London)</td> +<td>PG-Schema: a proposal for a schema language for property graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/jan-hidders-pg-schema.pdf">slides</a>, <a href="https://youtu.be/yQNL8hBTE4M">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Max de Marzi (RageDB and RelationalAI)</td> +<td>RageDB: Building a Graph Database in Anger – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/max-de-marzi-ragedb-building-a-graph-database-in-anger.pdf">slides</a>, <a href="https://youtu.be/LBbF8aslYFE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Umit Catalyurek (AWS)</td> +<td>HPC Graph Analytics on the OneGraph Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/umit-catalyurek-onegraph-hpc.pdf">slides</a>, <a href="https://youtu.be/64tv5LA6Wr8">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>David J. Haglin (Trovares)</td> +<td>How LDBC impacts Trovares – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/david-haglin-trovares.pdf">slides</a>, <a href="">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>16:25</td> +<td>Wenyuan Yu (Alibaba Damo Academy)</td> +<td>GraphScope Flex: A Graph Computing Stack with LEGO-Like Modularity – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/wenyuan-yu-graphscope-flex.pdf">slides</a>, <a href="https://youtu.be/cRikoyDmMks">video</a></td> +</tr> +<tr> +<td>16:30</td> +<td>16:40</td> +<td>Scott McMillan (Carnegie Mellon University)</td> +<td>Graph processing using GraphBLAS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/scott-mcmillan-graph-processing-using-graphblas.pdf">slides</a>, <a href="https://youtu.be/yb4hGBhUzQQ">video</a></td> +</tr> +<tr> +<td>16:45</td> +<td>16:55</td> +<td>Tim Mattson (Intel)</td> +<td>Graphs (GraphBLAS) and storage (TileDB) as Sparse Linear algebra – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tim-mattson-graphblas-and-tiledb.pdf">slides</a></td> +</tr> +<tr> +<td>17:00</td> +<td>20:00</td> +<td><em>happy hour (rooftop grill with beverages)</em></td> +<td><em>on the Nitro South building&rsquo;s 8th floor deck</em></td> +</tr> +</tbody> +</table> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + LDBC SNB – Early 2023 updates + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + Wed, 15 Feb 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + <p>2023 has been an eventful year for us so far. 
Here is a summary of our recent activities.</p>
+<ol>
+<li>
+<p>Our paper <a href="https://ldbcouncil.org/docs/papers/ldbc-snb-bi-vldb-2022.pdf">The LDBC Social Network Benchmark: Business Intelligence Workload</a> was published in PVLDB.</p>
+</li>
+<li>
+<p>David Püroja just completed his MSc thesis on creating a design towards <a href="https://ldbcouncil.org/docs/papers/msc-thesis-david-puroja-snb-interactive-v2-2023.pdf">SNB Interactive v2</a> at CWI&rsquo;s Database Architectures group. David and I gave a deep-dive talk at the FOSDEM conference&rsquo;s graph developer room titled <a href="https://fosdem.org/2023/schedule/event/graph_ldbc/">The LDBC Social Network Benchmark</a> (<a href="https://www.youtube.com/watch?v=YNF6z6gtXY4">YouTube mirror</a>).</p>
+</li>
+<li>
+<p>I gave a lightning talk at FOSDEM&rsquo;s HPC developer room titled <a href="https://www.youtube.com/watch?v=q26DHnQFw54">The LDBC Benchmark Suite</a> (<a href="https://www.youtube.com/watch?v=q26DHnQFw54">YouTube mirror</a>).</p>
+</li>
+<li>
+<p>Our auditors have successfully benchmarked a number of systems:</p>
+<ul>
+<li>SPB with the Ontotext GraphDB system for the SF3 and SF5 data sets (auditor: Pjotr Scholtze)</li>
+<li>SNB Interactive with the Ontotext GraphDB system for the SF30 data set (auditor: David Püroja)</li>
+<li>SNB Interactive with the TuGraph system running in the Aliyun cloud for the SF30, SF100, and SF300 data sets (auditor: Márton Búr)</li>
+</ul>
+</li>
+</ol>
+<p>The results and the full disclosure reports are available under the <a href="https://ldbcouncil.org/benchmarks/spb/">SPB</a> and <a href="https://ldbcouncil.org/benchmarks/snb/">SNB benchmark pages</a>.</p>
+
+
+
+
+ LDBC SNB Datagen – The winding path to SF100K
+ https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/
+ Tue, 13 Sep 2022 00:00:00 +0000
+
+ https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/
+ <p>LDBC SNB provides a data generator, which produces synthetic datasets, mimicking a social network’s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism and usability. More than two years have elapsed since my <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">last technical update</a> on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the challenges I faced during the migration. Since then, we have reached several goals: we refactored the serializers to use Spark&rsquo;s high-level writers, adding support for the popular Parquet data format and enabling runs on spot nodes; brought back factor generation; implemented support for the novel BI benchmark; and optimized the runtime to generate SF30K on 20 i3.4xlarge machines on AWS.</p>
+<h1 id="moving-to-sparksql">Moving to SparkSQL</h1>
+<p>We planned to move parts of the code to SparkSQL, an optimized runtime framework for tabular data. We hypothesized that this would benefit us on multiple fronts: SparkSQL offers an efficient batch analytics runtime, with higher level abstractions that are simpler to understand and work with, and we could easily add support for serializing to Parquet based on SparkSQL&rsquo;s capabilities.</p>
+<blockquote>
+<p>Spark SQL is a Spark module for structured data processing. It provides a programming abstraction called DataFrames and can also act as a distributed SQL query engine. Spark SQL includes a cost-based optimizer, columnar storage, and code generation to make queries fast.</p>
+</blockquote>
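+<p>To give a flavour of the kind of tabular manipulation this lets us express concisely, here is a minimal, self-contained sketch (illustrative only, not Datagen code) that explodes a semicolon-separated attribute column into a separate table:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">import org.apache.spark.sql.SparkSession
+import org.apache.spark.sql.functions.{explode, split}
+
+val spark = SparkSession.builder.appName(&#34;explode-example&#34;).master(&#34;local[*]&#34;).getOrCreate()
+import spark.implicits._
+
+// Toy Person table with a multi-valued email column (illustrative only).
+val person = Seq((1L, &#34;a@x.org;b@y.org&#34;), (2L, &#34;c@z.org&#34;)).toDF(&#34;id&#34;, &#34;email&#34;)
+
+// Derive a separate PersonEmail table by exploding the multi-valued column.
+val personEmail = person.select($&#34;id&#34;.as(&#34;PersonId&#34;), explode(split($&#34;email&#34;, &#34;;&#34;)).as(&#34;email&#34;))
+personEmail.show()</code></pre></div>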
+<p>Dealing with the dataset generator proved quite tricky, because it samples from various hand-written distributions and dictionaries, and contains complex domain logic, for which SparkSQL is unsuitable. We assessed that the best thing we could do was to wrap entire entity generation procedures in UDFs (user-defined SQL functions). However, several of these generators return entity trees<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup>, which are spread across multiple tables by the serializer, and these would have needed to be split up. Further complicating matters, we would have also had to find a way to coordinate the inner random generators&rsquo; state between the UDFs to ensure deterministic execution. Weighing these issues against the limited benefit we saw in SparkSQL for this part, we ultimately decided to leave entity generation as it is. We limited the SparkSQL refactor to the following areas:</p>
+<ol>
+<li>table manipulations related to shaping the output into the supported layouts and data types as set forth in the specification;</li>
+<li>deriving the Interactive and BI datasets;</li>
+<li>and generating the factor tables, which contain analytic information, such as population per country, number of friendships between city pairs, number of messages per day, etc., used by the substitution parameter generator to ensure predictable query runtimes.</li>
+</ol>
+<p>We refer to points (1.) and (2.) collectively as dataset transformation, and to (3.) as factor generation. Initially, these had been part of the generator; extracting them as part of this refactor resulted in a cleaner, more maintainable design.</p>
+<p><img src="datagen_df_0.png" alt="Datagen stages"></p>
+<p>The diagram above shows the components on a high level. The generator outputs a dataset called IR (intermediate representation), which is immediately written to disk. Then, the IR is input to the dataset transformation and factor generation stages, which respectively generate the final dataset and the factor tables. We are aware that spitting out the IR adds considerable runtime overhead and doubles the disk requirements in the worst-case scenario; however, we found that there&rsquo;s no simple way to avoid it, as the generator produces entity trees, which are incompatible with the flat, tabular, column-oriented layout of SparkSQL. On the positive side, this design enables us to reuse the generator output for multiple transformations and add new factor tables without regenerating the data.</p>
+<p>I&rsquo;ll skip describing the social network graph dataset generator (i.e. stage 1) in any more detail, apart from its serializer, as that was the only part involved in the current refactor.
If you are interested in more details, you may look up the <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">previous blogpost in the series</a> or the <a href="https://arxiv.org/abs/2001.02299">Interactive benchmark specification</a>.</p> +<h1 id="transformation-pipeline">Transformation pipeline</h1> +<p>The dataset transformation stage sets off where generation finished, and applies an array of pluggable transformations:</p> +<ul> +<li>explodes edges and / or attributes into separate tables,</li> +<li>subsets the snapshot part and creates insert / delete batches for the BI workload,</li> +<li>subsets the snapshot part for the Interactive workload,</li> +<li>applies formatting related options such as date time representation,</li> +<li>serializes the data to a Spark supported format (CSV, Parquet),</li> +</ul> +<p>We utilize a flexible data pipeline that operates on the graph.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span>, <span style="color:#66d9ef">M2</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">]</span> <span style="color:#a6e22e">extends</span> <span style="color:#f92672">(</span><span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">])</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">In</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> apply<span style="color:#f92672">(</span>v<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">])</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=</span> transform<span 
style="color:#f92672">(</span>v<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>The <code>Transform</code> trait encodes a pure (side effect-free) function polymorphic over graphs, so that transformation pipelines can be expressed with ordinary function composition in a type safe manner. Let&rsquo;s see some of the transformations we have.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToBiTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">BI</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> keepImplicitDeletes<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.BI</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span 
style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeEdges</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Therefore, a transformation pipeline may look like this:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>params<span style="color:#f92672">,</span> start<span style="color:#f92672">,</span> end<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span 
style="color:#66d9ef">val</span> outputGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>inputGraph<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>The <code>Graph</code> record has a <code>definition</code> field containing graph-global metadata, whereas <code>entities</code> holds the datasets keyed by their entity type. There are 3 graph <em>modes</em> currently: <code>Raw</code>, <code>Interactive</code> and <code>BI</code>. The BI dataset has different layout than the rest, as it contains incremental inserts and deletes for the entities additionally to the bulk snapshot. This is captured in the <code>Layout</code> dependent type, over which the entities are polymorphic.</p> +<p>It&rsquo;s important to understand that <code>Graph</code> holds <code>DataFrame</code>s, and these are lazily computed by Spark. So, <code>Graph</code> is merely a description of transformations used to derive the comprising datasets, which makes them subject to all the SparkSQL fanciness such as query optimization, whole stage code generation, and so on. Processing is delayed until an action (such as a disk write) forces it.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> isAttrExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> isEdgesExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> useTimestamp<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">M</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">Option</span><span style="color:#f92672">[</span><span style="color:#66d9ef">String</span><span style="color:#f92672">]]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> definition<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M</span><span style="color:#f92672">],</span> 
+</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">M</span><span style="color:#66d9ef">#</span><span style="color:#66d9ef">Layout</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">sealed</span> <span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Raw</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Interactive</span><span style="color:#f92672">(</span>bulkLoadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... 
*/</span>
+</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span>
+</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">BI</span><span style="color:#f92672">(</span>bulkloadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">,</span> batchPeriod<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">String</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span>
+</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">BatchedEntity</span>
+</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span>
+</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span>
+</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span>
+</span></span></code></pre></div><p>You may notice that <code>Transform</code> is statically typed w.r.t. <code>Mode</code>; however, other properties, like <code>isAttrExploded</code> or <code>isEdgesExploded</code>, are not captured in the type and remain merely dynamic. This makes some nonsensical transformation pipelines (e.g. one that explodes edges twice in a row) syntactically valid. This trade-off in compile-time safety was made to prevent overcomplicating the types.</p>
+<p>As we already mentioned, <code>Graph</code> is essentially a persistent container of <code>EntityType -&gt; DataFrame</code> mappings. <code>EntityType</code> can be <code>Node</code>, <code>Edge</code> and <code>Attr</code>, and is used to identify the entity and embellish it with static metadata, such as a descriptive name and primary key, whether it is static or dynamic (as per the specification), and, in the case of edges, the source and destination type and cardinality. This makes it very simple to create transformation rules on static entity properties with pattern matching.</p>
+<p>Usually, a graph transformation involves matching entities based on their <code>EntityType</code>, and modifying the mapping (and if required, other metadata).</p>
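+<p>As a rough illustration (these are not the actual Datagen definitions, which carry additional metadata; the field names here are assumed), the <code>EntityType</code> hierarchy and the kind of pattern matching it enables might look like this:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">import org.apache.spark.sql.DataFrame
+
+// Simplified stand-in for the EntityType ADT; field names are assumed for illustration.
+sealed trait EntityType { def isStatic: Boolean }
+final case class Node(name: String, isStatic: Boolean) extends EntityType
+final case class Edge(name: String, source: String, destination: String, isStatic: Boolean) extends EntityType
+final case class Attr(attribute: String, parent: Node, attributeType: String) extends EntityType {
+  val isStatic = false
+}
+
+// A transformation rule can select entities purely on static metadata,
+// e.g. keeping only the dynamic nodes of a graph:
+def dynamicNodes(entities: Map[EntityType, DataFrame]): Map[EntityType, DataFrame] =
+  entities.collect { case (k @ Node(_, false), df) =&gt; k -&gt; df }</code></pre></div>
+<p>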
Take, for example, the <code>ExplodeAttrs</code> transformation, which explodes into separate tables the values of two columns of <code>Person</code> stored as arrays:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">if</span> <span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#75715e">// assert at runtime that the transformation hasn&#39;t been applied yet +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#66d9ef">throw</span> <span style="color:#66d9ef">new</span> <span style="color:#a6e22e">AssertionError</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Attributes already exploded in the input graph&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> explodedAttr<span style="color:#f92672">(</span>attr<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Attr</span><span style="color:#f92672">,</span> node<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">DataFrame</span><span style="color:#f92672">,</span> column<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Column</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">=</span> +</span></span><span style="display:flex;"><span> attr <span style="color:#f92672">-&gt;</span> node<span style="color:#f92672">.</span>select<span style="color:#f92672">(</span>withRawColumns<span style="color:#f92672">(</span>attr<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>parent<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">),</span> explode<span style="color:#f92672">(</span>split<span style="color:#f92672">(</span>column<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;;&#34;</span><span 
style="color:#f92672">)).</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>attribute<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">)))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> modifiedEntities <span style="color:#66d9ef">=</span> input<span style="color:#f92672">.</span>entities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>collect <span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k <span style="color:#66d9ef">@</span> <span style="color:#a6e22e">Node</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person&#34;</span><span style="color:#f92672">,</span> <span style="color:#66d9ef">false</span><span style="color:#f92672">),</span> df<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#75715e">// match the Person node. This is the only one ExplodeAttrs should modify +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#a6e22e">Map</span><span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Email&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;EmailAddress&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonEmailEmailAddress&#34; entity derived by exploding the email column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Speaks&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;Language&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonSpeaksLanguage&#34; entity derived by exploding the language column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> k <span style="color:#f92672">-&gt;</span> df<span style="color:#f92672">.</span>drop<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">)</span> <span style="color:#75715e">// drop the exploded columns from person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> 
updatedEntities <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>entities<span style="color:#f92672">)(</span><span style="color:#66d9ef">_</span> <span style="color:#f92672">++</span> <span style="color:#66d9ef">_</span><span style="color:#f92672">)</span> <span style="color:#75715e">// merge-replace the modified entities in the graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> updatedEntityDefinitions <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#f92672">(</span>e<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> e <span style="color:#f92672">++</span> v<span style="color:#f92672">.</span>map<span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> k <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Some</span><span style="color:#f92672">(</span>v<span style="color:#f92672">.</span>schema<span style="color:#f92672">.</span>toDDL<span style="color:#f92672">)</span> <span style="color:#f92672">}</span> <span style="color:#75715e">// update the entity definition schema to reflect the modifications +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> l <span style="color:#66d9ef">=</span> lens<span style="color:#f92672">[</span><span style="color:#66d9ef">In</span><span style="color:#f92672">]</span> <span style="color:#75715e">// lenses provide a terse syntax for modifying nested fields +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">(</span>l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>entities<span style="color:#f92672">).</span>set<span style="color:#f92672">(</span>input<span style="color:#f92672">)((</span><span style="color:#66d9ef">true</span><span style="color:#f92672">,</span> updatedEntityDefinitions<span style="color:#f92672">,</span> updatedEntities<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Note that <code>EntityType</code> does not hold the dataset&rsquo;s full SQL schema currently, as it&rsquo;s not useful for pattern matching, but can be accessed 
directly from <code>DataFrame</code> if needed.</p> +<h1 id="inputoutput">Input/output</h1> +<p>The <code>Reader</code> and <code>Writer</code> typeclasses are used to read from a <code>Source</code> and write to a <code>Sink</code> respectively, terminating a graph transformation pipeline<br> +on both ends.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">T</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> read<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> exists<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">S</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Data</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> write<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Data</span><span style="color:#f92672">,</span> sink<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">S</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Unit</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>There are implementations under <code>ldbc.datagen.io.instances</code> that read a graph from a <code>GraphSource</code> and write to a <code>GraphSink</code>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span 
style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> source <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSource</span>, <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>read<span style="color:#f92672">(</span>source<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span><span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>graph<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// write +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> sink <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSink</span>, <span 
style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>write<span style="color:#f92672">(</span>transformedGraph<span style="color:#f92672">,</span> sink<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>We provide <a href="https://github.com/typelevel/simulacrum">Ops syntax</a> to make it shorter:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Reader.ops._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Writer.ops._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">).</span>read +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> <span style="color:#f92672">???</span> <span style="color:#75715e">/* ... 
*/</span>
+</span></span><span style="display:flex;"><span>
+</span></span><span style="display:flex;"><span><span style="color:#75715e">// write
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span>
+</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span>
+</span></span><span style="display:flex;"><span>transformedGraph<span style="color:#f92672">.</span>write<span style="color:#f92672">(</span><span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">))</span>
+</span></span></code></pre></div><p>The reader/writer architecture is layered: the graph reader/writer uses dataframe readers/writers for each of its entities. One interesting aspect of implementing the reader was dealing with the input schema. Parquet is self-describing; however, as we also support the CSV format, we had to provide a way for correct schema detection and column parsing.</p>
+<p>Spark has a facility to derive SparkSQL schema from case classes automatically<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup>. We created case classes for each entity in the <code>Raw</code> dataset. We also created a typeclass <code>EntityTraits</code> associating these classes with their <code>EntityType</code>, so we can summon them (and consequently their SparkSQL schema) in the reader.</p>
+<p>The case classes are used during the serialization of the generated dataset too, but more about that later.</p>
+<h1 id="factor-generation">Factor generation</h1>
+<p>As we already mentioned, factor generation was originally part of the data generator, i.e. factor tables were calculated on the fly and emitted as side outputs. This design had some problems. Auxiliary data structures had to be maintained and interleaved with generation, which violated separation of concerns, consequently hurting readability and maintainability. Also, anything more complicated than entity-local aggregates was impossible to express in the original MapReduce framework. To keep the preceding Spark rewrite at a manageable scope, the original factor generation code had been removed.</p>
+<p>We decided it was best to reintroduce factor generation as a post-processing step that operates on the generated data. This makes it possible to express more complex analytical queries, requires no prior knowledge about the generator, can be done in SparkSQL (making it much simpler), and removes the impact on the generator&rsquo;s performance, so that we can optimize the two separately. Since this refactor, we have almost tripled the number of factor tables (up to 31, covering both SNB workloads, BI and Interactive). The queries computing certain factor tables even use <a href="https://spark.apache.org/graphx/">GraphX</a>, which was unimaginable with the previous design.</p>
+<p>Factor tables are added by extending a map with a <code>name -&gt; Factor</code> pair.
<code>Factor</code> declares is input entities, and accepts a function that receives input <code>DataFrames</code>, and returns a single <code>DataFrame</code> as output.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> factors <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Map</span> <span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;personDisjointEmployerPairs&#34;</span> <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Factor</span><span style="color:#f92672">(</span><span style="color:#a6e22e">PersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonKnowsPersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">OrganisationType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonWorkAtCompanyType</span><span style="color:#f92672">)</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">case</span> <span style="color:#a6e22e">Seq</span><span style="color:#f92672">(</span>person<span style="color:#f92672">,</span> personKnowsPerson<span style="color:#f92672">,</span> organisation<span style="color:#f92672">,</span> workAt<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> knows <span style="color:#66d9ef">=</span> undirectedKnows<span style="color:#f92672">(</span>personKnowsPerson<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> company <span style="color:#66d9ef">=</span> organisation<span style="color:#f92672">.</span>where<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;Type&#34;</span> <span style="color:#f92672">===</span> <span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">).</span>cache<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> personSample <span style="color:#66d9ef">=</span> person +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>orderBy<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>limit<span style="color:#f92672">(</span><span style="color:#ae81ff">20</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> personSample +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person2&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>knows<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;knows&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;knows.person2Id&#34;</span> <span style="color:#f92672">===</span> $<span 
style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>workAt<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;workAt&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;workAt.PersonId&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;knows.Person1id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>company<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;Company.id&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;workAt.CompanyId&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>select<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2id&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.name&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyName&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyId&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.creationDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2creationDate&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.deletionDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2deletionDate&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>distinct<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">},</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* more factors */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span></code></pre></div><p>As you can see, it&rsquo;s not much complicated than using plain SQL, with the added benefit of being able to extract recurring subqueries to functions (e.g. <code>undirectedKnows</code>). Currently, there&rsquo;s no parallelization between different factor tables (although each of them is parallelized internally by Spark). 
+<p>The Factor table writer uses the same componentized architecture as the graph writer, i.e. it uses the dataframe writer under the hood.</p> +<h1 id="revamping-the-data-generators-serializer">Revamping the data generator&rsquo;s serializer</h1> +<p>At this point, both the transformation pipeline and the factor generator were ready; however, the data generator was still chugging along with the old serializer, emitting the IR in CSV. We wanted to move this to Parquet to improve performance and reduce its size, but there was a problem: due to the generator&rsquo;s custom data representation, SparkSQL (and its DataSource API) was off-limits. So we bit the bullet and rewrote the existing serializer to emit Parquet.</p> +<blockquote> +<p><a href="https://parquet.apache.org/">Parquet</a> is an open source data format that evolved to be the de facto standard for Big Data batch pipelines. It offers a column-oriented, compressed, schemaful representation that is space-efficient and suited for analytic queries. The file format leverages a record shredding and assembly model, which originated at Google. This results in a file that is optimized for query performance and minimizing I/O.</p> +</blockquote> +<p>The new serialization framework is heavily influenced by the design of Java <code>OutputStreams</code>, in the sense that stateful objects are composed to form a pipeline. For example, in the case of <em>activities</em>, the input is an activity tree, and the output is a set of rows in multiple files (e.g. forum, forumHasTag, post, postHasTag, etc.). The components that take part in activity serialization are shown in the diagram below. The activity tree is iterated (1st component) and the corresponding entity serializer is called (2nd component), which is fed into a component that splits the records (3rd one) among several output streams writing individual files (last).</p> +<p><img src="activity.png" alt="Activity serialization pipeline"></p> +<p>The benefit of this architecture is that only the last component needs to change when we add support for a new output format.</p> +<p>To support Parquet, we made use of row-level serializers available in Hadoop&rsquo;s Parquet library (bundled with SparkSQL), and internal classes in SparkSQL to derive the Parquet schema for our entities. Remember how we used case classes for the <code>Raw</code> entities to derive the input schema in the graph reader during dataset transformation? Here we use the same classes (e.g. <code>Forum</code>) and Spark&rsquo;s <code>Encoder</code> framework to encode the entities in Parquet, which means that the generated output remains consistent with the <code>DataFrame</code>-based reader, and we avoid a lot of code duplication.</p>
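+<p>As a rough sketch of this reuse (not the actual Datagen code; the <code>Forum</code> case class below is a simplified stand-in with made-up fields), deriving the schema from a case class via Spark&rsquo;s <code>Encoder</code> machinery looks roughly like this:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">import org.apache.spark.sql.Encoders
+
+// Simplified stand-in for the Raw Forum entity; the real class has more fields.
+case class Forum(id: Long, title: String, creationDate: Long, moderatorPersonId: Long)
+
+// The encoder derived from the case class yields the schema that both the
+// DataFrame-based reader and the Parquet serializer can share, so the two cannot drift apart.
+val forumEncoder = Encoders.product[Forum]
+println(forumEncoder.schema.treeString)
+</code></pre></div>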
+<h1 id="optimizations">Optimizations</h1> +<p>After these refactors, we were able to generate the BI dataset with scale factor 10K on 300 i3.4xlarge machines in one hour. Decreasing the number of machines resulted in out-of-memory errors in the generator. We realized that partition sizes (and thus the number of partitions) should be determined based on the available memory. Our experiments showed that a machine with 128GB of memory is capable of generating SF3K (scale factor 3000) reliably with 3 blocks<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> per partition given ample disk size to allow for spills (tested with 3.8TB); while fewer partitions (and consequently a larger block/partition ratio) would introduce OOM errors. Furthermore, we split the data generator output after a certain number of rows written, to guard against the skew between different kinds of entities possibly causing problems during transformation<sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup>. These optimizations enabled us to run SF10K reliably on 4 i3.4xlarge machines in 11 hours (which is still a more than 6x reduction in cost). We weren&rsquo;t able to run SF30K on 10 machines (1 machine / SF3K); even 15 ran out of disk. This non-linear disk use should be investigated further as it complicates calculating cluster sizes for larger scale factors.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf3k_bi <span style="color:#ae81ff">3000</span> parquet bi <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">330</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs +</span></span></code></pre></div><div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf10k_bi <span style="color:#ae81ff">10000</span> parquet bi <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">1000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs +</span></span></code></pre></div><p>The above examples show working configurations for generating the 3K and 10K BI datasets. The <code>--sf-per-executor</code> option controls the number of worker nodes allocated, in this case 1 node for every 3000 SF, i.e. 1 and 4 nodes, respectively. The <code>--partitions</code> option controls the total number of partitions, and was calculated based on the number of persons using the formula <code>partitions = ceil(number_of_persons / block_size / 3)</code> to get a maximum of 3 blocks per partition.</p>
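+<p>To make the arithmetic concrete, here is the same formula as a one-liner, using the 10,000-person block size mentioned in the footnotes. The person count is a made-up illustrative number, not an official SF3K figure; it is simply chosen so that the result lines up with the <code>--partitions 330</code> used above.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">// partitions = ceil(number_of_persons / block_size / blocks_per_partition)
+def partitionsFor(numPersons: Long, blockSize: Long = 10000L, blocksPerPartition: Int = 3): Int =
+  math.ceil(numPersons.toDouble / blockSize / blocksPerPartition).toInt
+
+partitionsFor(9900000L) // = 330, i.e. at most 3 blocks of 10,000 persons per partition
+</code></pre></div>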
+<h1 id="conclusion">Conclusion</h1> +<p>These improvements made LDBC SNB Datagen more modular, maintainable and efficient, costing under a cent per scale factor to generate the BI dataset, which enables us to generate datasets beyond SF 100K.</p> +<h1 id="footnotes">Footnotes</h1> +<div class="footnotes" role="doc-endnotes"> +<hr> +<ol> +<li id="fn:1"> +<p>The generator produces hierarchies, such as a forum wall with a random number of posts that have comments, etc. This tree is iterated, and different entities are written to separate files.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:2"> +<p>Shameless plug: You can learn more about this from <a href="https://www.dataversity.net/case-study-deriving-spark-encoders-and-schemas-using-implicits/">another blogpost of mine</a>.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:3"> +<p>The data generator produces blocks of 10,000 persons and their related entities. Entities from different blocks are unrelated (isolated).&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:4"> +<p>The maximum row count per file is currently 10M; however, this can be modified with a command line option. We also had an alternative design in mind where this number would have been determined based on the average row size of each entity; however, we stayed with the first version for simplicity.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +</ol> +</div> + + + + + Fifteenth TUC Meeting + https://ldbcouncil.org/event/fifteenth-tuc-meeting/ + Fri, 17 Jun 2022 09:20:00 -0500 + + https://ldbcouncil.org/event/fifteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Gábor Szárnyas, Jack Waudby, Peter Boncz, Alastair Green</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2022.sigmod.org/venue.shtml">SIGMOD 2022</a> on <strong>June 17-18 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10-15 minute talks followed by a Q&amp;A session. The talks will be recorded and made available online.<br> +The tentative program is the following.
<strong>All times are in EDT.</strong></p> +<p>We will have a social event on Friday at 17:30 at <a href="https://elvezrestaurant.com/">El Vez</a> (<a href="https://g.page/ElVezPhilly">Google Maps</a>).</p> +<h4 id="friday-pennsylvania-convention-centerhttpswwwpaconventioncom-room-204bhttps2022sigmodorgprogramshtml">Friday (<a href="https://www.paconvention.com/">Pennsylvania Convention Center</a>, <a href="https://2022.sigmod.org/program.shtml">room 204B</a>)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:20</td> +<td>09:30</td> +<td>Peter Boncz (LDBC/CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/39BoOIGk9Is">video</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Alastair Green (LDBC/Birkbeck)</td> +<td>LDBC&rsquo;s fair use policies – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-fair-use-of-the-ldbc-trademark.pdf">slides</a>, <a href="https://youtu.be/7zmCysN4Rpg">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Gábor Szárnyas (LDBC/CWI), Jack Waudby (Newcastle University)</td> +<td>LDBC Social Network Benchmark: Business Intelligence workload v1.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/gabor-szarnyas-the-ldbc-social-network-benchmark-business-intelligence-workload.pdf">slides</a>, <a href="https://youtu.be/AJ96M8_njxE">video</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Heng Lin (Ant Group)</td> +<td>LDBC Financial Benchmark introduction – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/heng-lin-ldbc-financial-benchmark-introduction.pdf">slides</a>, <a href="https://youtu.be/iBhud_YjafY">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Chen Zhang (CreateLink)</td> +<td>New LDBC SNB benchmark record by Galaxybase: More than 6 times faster and 70% higher throughput – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/chen-zhang-new-ldbc-snb-benchmark-record-by-galaxybase-more-than-6-times-faster-and-70-percent-higher-throughput.pdf">slides</a>, <a href="https://youtu.be/sMzTsb8iw_Y">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>James Clarkson (Neo4j)</td> +<td>LDBC benchmarks: Promoting good science and industrial consumption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/james-clarkson-ldbc-benchmarks-promoting-good-science-and-industrial-consumption.pdf">slides</a>, <a href="https://youtu.be/VYG1mzcl9qQ">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Oskar van Rest (Oracle)</td> +<td>Creating and querying property graphs in Oracle, on-premise and in the cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oskar-van-rest-creating-and-querying-property-graphs-in-oracle-on-premise-and-in-the-cloud.pdf">slides</a>, <a href="https://youtu.be/2HX2Vixf2gs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:15</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>Conquering LDBC SNB BI at SF-10k – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/mingxi-wu-conquering-ldbc-snb-bi-at-sf10k.pdf">slides</a>, <a href="https://youtu.be/oJbqzQ_t3G8">video</a></td> +</tr> +<tr> +<td>12:20</td> +<td>13:20</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:20</td> +<td>13:35</td> +<td>Altan Birler (Technische Universität München)</td> +<td>Relational databases can handle graphs too! Experiences with optimizing the Umbra RDBMS for LDBC SNB BI – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/altan-birler-relational-databases-can-handle-graphs-too.pdf">slides</a>, <a href="https://youtu.be/cRgbdY3I2i4">video</a></td> +</tr> +<tr> +<td>13:40</td> +<td>13:55</td> +<td>David Püroja (CWI)</td> +<td>LDBC Social Network Benchmark: Interactive workload v2.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/david-puroja-ldbc-snb-interactive-workload-v2.0.pdf">slides</a></td> +</tr> +<tr> +<td>14:00</td> +<td>14:15</td> +<td>Angela Bonifati (Lyon 1 University)</td> +<td>The quest for schemas in graph databases – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/angela-bonifati-the-quest-for-schemas-in-graph-databases.pdf">slides</a>, <a href="https://youtu.be/VT7cx3Jp7V8">video</a></td> +</tr> +<tr> +<td>14:20</td> +<td>14:35</td> +<td>Matteo Lissandrini (Aalborg University)</td> +<td>Understanding graph data representations in triplestores – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/matteo-lissandrini-understanding-graph-data-representations-in-triplestores.pdf">slides</a>, <a href="https://youtu.be/xqVMJZfh_JU">video</a></td> +</tr> +<tr> +<td>14:40</td> +<td>14:55</td> +<td>Wim Martens (University of Bayreuth)</td> +<td>Path representations – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/wim-martens-path-representations.pdf">slides</a>, <a href="https://youtu.be/Ma-E5dwgf-E">video</a></td> +</tr> +<tr> +<td>15:00</td> +<td>15:20</td> +<td>Audrey Cheng (UC Berkeley)</td> +<td>TAOBench: An end-to-end benchmark for social network workloads – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/audrey-cheng-taobench.pdf">slides</a>, <a href="https://youtu.be/1p8AStxS3es">video</a></td> +</tr> +</tbody> +</table> +<h4 id="saturday-philadelphia-marriott-downtownhttpswwwmarriottcomen-ushotelsphldt-philadelphia-marriott-downtown-room-401-402-4th-floor">Saturday (<a href="https://www.marriott.com/en-us/hotels/phldt-philadelphia-marriott-downtown/">Philadelphia Marriott Downtown</a>, room 401-402, 4th floor)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Keith Hare (WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/keith-hare-property-graph-standards-process-and-timing.pdf">slides</a>, <a href="https://youtu.be/xFVD3LWnKlc">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>10:35</td> +<td>Leonid Libkin (ENS Paris)</td> +<td>Pattern matching in GQL and SQL/PGQ – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/leonid-libkin-pattern-matching-in-gql-and-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/OvGsa0qLANE">video</a></td> +</tr> +<tr> +<td>10:40</td> +<td>10:55</td> +<td>Petra Selmer (Neo4j/WG3)</td> +<td>An overview of GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/petra-selmer-towards-gql-v1-a-property-graph-query-language-standard.pdf">slides</a>, <a href="https://youtu.be/tncf2FgyIyo">video</a></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (LDBC/WG3)</td> +<td>GQL 2.0: A technical manifesto – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-gql-2.0-a-technical-manifesto.pdf">slides</a>, <a href="https://youtu.be/upIvpYy8C2g">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>George Fletcher (TU Eindhoven)</td> +<td>PG-Keys (LDBC Property Graph Schema Working Group) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/george-fletcher-pg-keys-keys-for-property-graphs.pdf">slides</a>, <a href="https://youtu.be/_W8-jOtcObc">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Arvind Shyamsundar (Microsoft)</td> +<td>Graph capabilities in Microsoft SQL Server and Azure SQL Database – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/arvind-shyamsundar-graph-capabilities-in-microsoft-sql-server-and-azure-database.pdf">slides</a>, <a href="https://youtu.be/xxV2BfZupGw">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>13:30</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Daniël ten Wolde (CWI)</td> +<td>Implementing SQL/PGQ in DuckDB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/daniel-ten-wolde-implementing-sql-pgq-in-duckdb.pdf">slides</a>, <a href="https://youtu.be/JmSfU0BTH5w">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Oszkár Semeráth, Kristóf Marussy (TU Budapest)</td> +<td>Generation techniques for consistent, realistic, diverse, and scalable graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oszkar-semerath-generation-techniques-for-consistent-realistic-diverse-and-scalable-graphs.pdf">slides</a>, <a href="https://youtu.be/hB6j6mvh-vA">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Molham Aref (RelationalAI)</td> +<td>Graph Normal Form – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/molham-aref-graph-normal-form.pdf">slides</a>, <a href="https://youtu.be/-kP4Raqr5KA">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Naomi Arnold (Queen Mary University of London)</td> +<td>Temporal graph analysis of the far-right social network Gab – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/naomi-arnold-temporal-graph-analysis-of-the-far-right-social-network-gab.pdf">slides</a>, <a href="https://youtu.be/ugSkFlif4PE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:05</td> +<td>Domagoj Vrgoč (PUC Chile)</td> +<td>Evaluating path queries in MillenniumDB – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/domagoj-vrgoc-regular-path-queries-in-millenniumdb.pdf">slides</a>, <a href="https://youtu.be/_OzJ6vI7GNU">video</a></td> +</tr> +<tr> +<td>15:10</td> +<td>15:25</td> +<td>Pavel Klinov, Evren Sirin (Stardog)</td> +<td>Stardog&rsquo;s experience with LDBC – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/evren-sirin-stardog-experience-with-ldbc.pdf">slides</a>, <a href="https://youtu.be/CBrEeOTqGKM">video</a></td> +</tr> +</tbody> +</table> + + + + + Announcing the LDBC Financial Benchmark Task Force + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + Thu, 26 May 2022 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + <p>We are delighted to announce the set up of the <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench) task force</a>.</p> +<p>The Financial Benchmark (FinBench) project aims to define a graph database evaluating benchmark and develop a data generation process and a query driver to make the evaluation of the graph database representative, reliable and comparable, especially in financial scenarios, such as anti-fraud and risk control. The FinBench is scheduled to be released in the end of 2022.</p> +<p>Compared to LDBC SNB, the FinBench will differ in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. FinBench is going to redesign the data pattern and workloads, including the data generation, the query driver, and also some other facilities referred to LDBC SNB.</p> +<p>The FinBench Task Force was approved by LDBC on May 16, 2022. The FinBench Task Force is led by Ant Group, and the initial members also include Pometry, Create Link, StarGraph, Ultipa, Katana, Intel, Memgraph (observer) and Koji Annoura (individual member). See the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">Work Charter for FinBench</a></p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or guozhihui.gzh at antgroup.com.</p> + + + + + Fourteenth TUC Meeting + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + Mon, 16 Aug 2021 16:00:00 +0200 + + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + <p>LDBC was hosting a one-day hybrid workshop, co-located with <a href="https://vldb.org/2021/">VLDB 2021</a> on <strong>August 16 (Monday) between 16:00–20:00 CEST</strong>.</p> +<p>The physical part of the workshop was held in room Akvariet 2 of the <a href="https://www.tivolihotel.com/">Tivoli Hotel</a> (Copenhagen), while the virtual part was hosted on Zoom. Our programme consisted of talks that provide an overview of LDBC&rsquo;s recent efforts. Moreover, we have invited industry practitioners and academic researchers to present their latest results.</p> +<p>Talks were scheduled to be 10 minutes with a short Q&amp;A session. We had three sessions. 
Their schedules are shown below.</p> +<h4 id="16001725-cest-ldbc-updates-benchmarks-query-languages">[16:00–17:25 CEST] LDBC updates, benchmarks, query languages</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>16:00</td> +<td>Peter Boncz (CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a></td> +</tr> +<tr> +<td>16:05</td> +<td>Gábor Szárnyas (CWI)</td> +<td>Overview of LDBC benchmarks – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-benchmarks.pdf">slides</a></td> +</tr> +<tr> +<td>16:12</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>LDBC Social Network Benchmark results with TigerGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mingxi-wu-tigergraph-snb-preliminary-results.pdf">slides</a></td> +</tr> +<tr> +<td>16:24</td> +<td>Xiaowei Zhu (Ant Group)</td> +<td>Financial Benchmark proposal – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/xiaowei-zhu-financial-benchmark.pdf">slides</a></td> +</tr> +<tr> +<td>16:36</td> +<td>Petra Selmer (Neo4j)</td> +<td>Status report from the Existing Languages Working Group (ELWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/petra-selmer-elwg.pdf">slides</a>, <a href="https://youtu.be/I5A8VuFDhsA">video</a></td> +</tr> +<tr> +<td>16:48</td> +<td>Jan Hidders (Birkbeck)</td> +<td>Status report from the Property Graph Schema Working Group (PGSWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/jan-hidders-pgswg.pdf">slides</a>, <a href="https://youtu.be/iEbVi9T-HVk">video</a></td> +</tr> +<tr> +<td>17:00</td> +<td>Keith Hare (JCC Consulting)</td> +<td>Database Language Standards Structure and Process, SQL/PGQ – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/keith-hare-database-language-standards-structure-and-process-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/ZgFCuzods4g">video</a></td> +</tr> +<tr> +<td>17:12</td> +<td>Stefan Plantikow (GQL Editor)</td> +<td>Report on the GQL standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/stefan-plantikow-gql.pdf">slides</a>, <a href="https://youtu.be/z0pN5NwKsgc">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="17351845-cest-systems-and-data-structures">[17:35–18:45 CEST] Systems and data structures</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>17:35</td> +<td>Vasileios Trigonakis (Oracle Labs)</td> +<td>PGX.D aDFS: An Almost Depth-First-Search Distributed Graph-Querying System – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasileios-trigonakis-pgxd-adfs.pdf">slides</a>, <a href="https://youtu.be/cv2ZfWRBOek">video</a></td> +</tr> +<tr> +<td>17:47</td> +<td>Matthias Hauck (SAP)</td> +<td>JSON, Spatial, Graph – Multi-model Workloads with SAP HANA Cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/matthias-hauck-json-spatial-graph-sap-hana-cloud.pdf">slides</a>, <a 
href="https://youtu.be/dgpMJFho6Q8">video</a></td> +</tr> +<tr> +<td>17:59</td> +<td>Nikolay Yakovets (Eindhoven University of Technology)</td> +<td>AvantGraph – <a href="https://youtu.be/z0pN5NwKsgcttachments/nikolay-yakovets-avantgraph.pdf">slides</a>, <a href="https://youtu.be/9M9FOycovTw">video</a></td> +</tr> +<tr> +<td>18:11</td> +<td>Semih Salihoglu (University of Waterloo)</td> +<td>GRainDB: Making RDBMSs Efficient on Graph Workloads Through Predefined Joins – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semih-salihoglu-graindb.pdf">slides</a>, <a href="https://youtu.be/FFK3y6vPHJs">video</a></td> +</tr> +<tr> +<td>18:23</td> +<td>Semyon Grigorev (Saint Petersburg University)</td> +<td>Context-free path querying: Obstacles on the way to adoption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semyon-grigorev-cfpq.pdf">slides</a>, <a href="https://youtu.be/pha1xIpEL3I">video</a></td> +</tr> +<tr> +<td>18:35</td> +<td>Per Fuchs (Technical University of Munich)</td> +<td>Sortledton: A universal, transactional graph data structure – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/per-fuchs-sortledton.pdf">slides</a>, <a href="https://youtu.be/33ZjsNN0hhU">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="1855-2000-cest-high-level-approaches-and-benchmarks">[18:55-20:00 CEST] High-level approaches and benchmarks</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>18:55</td> +<td>Angelos-Christos Anadiotis (Ecole Polytechnique and Institut Polytechnique de Paris)</td> +<td>Empowering Investigative Journalism with Graph-based Heterogeneous Data Management – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/angelos-christos-anadiotis-investigative-journalism-graph-data-management.pdf">slides</a>, <a href="https://youtu.be/a1VYjyec8dg">video</a></td> +</tr> +<tr> +<td>19:07</td> +<td>Vasia Kalavri (Boston University)</td> +<td>Learning to partition unbounded graph streams – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasia-kalavri-learning-to-partition-unbounded-graph-streams.pdf">slides</a>, <a href="https://youtu.be/PTlUABKWniA">video</a></td> +</tr> +<tr> +<td>19:19</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Towards a Hybrid OLTP-OLAP Graph Benchmark – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/muhammad-attahir-jibril-hybrid-oltp-olap-benchmark.pdf">slides</a>, <a href="https://youtu.be/tMBVszTSJXc">video</a></td> +</tr> +<tr> +<td>19:31</td> +<td>Riccardo Tommasini (University of Tartu)</td> +<td>An outlook on Benchmarks for Graph Stream Processing – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/riccardo-tommasini-graph-stream-processing-benchmarks.pdf">slides</a>, <a href="https://youtu.be/HabvJvPXsLc">video</a></td> +</tr> +<tr> +<td>19:43</td> +<td>Mohamed Ragab (University of Tartu)</td> +<td>Benchranking: Towards prescriptive analysis of big graph processing: the case of SparkSQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mohamed-ragab-benchranking.pdf">slides</a>, <a href="https://youtu.be/mZ8LhGUq7Wg">video</a></td> 
+</tr> +</tbody> +</table> + + + + + Thirteenth TUC Meeting + https://ldbcouncil.org/event/thirteenth-tuc-meeting/ + Tue, 30 Jun 2020 14:00:00 +0000 + + https://ldbcouncil.org/event/thirteenth-tuc-meeting/ + <p>LDBC is pleased to announce its Thirteenth Technical User Community (TUC) meeting.</p> +<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p> +<p>This TUC meeting will be a two-day event hosted online. We welcome all users of RDF and Graph technologies to attend. If you are interested in attending the event, please contact Gabor Szarnyas (BME) to register.</p> +<h3 id="snb-task-force">SNB Task Force</h3> +<ul> +<li>Progress report +<ul> +<li>ACID compliance test suite</li> +<li>Integrating deletions to Datagen</li> +<li>Migrating Datagen to Spark</li> +<li>Redesign of BI read queries</li> +<li>Extensions to the driver</li> +</ul> +</li> +<li>Ongoing work +<ul> +<li>Datagen: tuning the distribution of deletes</li> +<li>Interactive 2.0 workload</li> +<li>BI 1.0 workload</li> +</ul> +</li> +</ul> +<p>Zoom links will be sent through email.</p> + + + + + Speeding Up LDBC SNB Datagen + https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/ + Fri, 12 Jun 2020 00:00:00 +0000 + + https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/ + <p>LDBC&rsquo;s <a href="#references">Social Network Benchmark [4]</a> (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework where different graph-based technologies can be fairly tested and compared, that can drive the identification of systems&rsquo; bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data management.</p> +<p>LDBC SNB provides <a href="https://github.com/ldbc/ldbc_snb_datagen">Datagen</a> (Data Generator), which produces synthetic datasets, mimicking a social network&rsquo;s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism and usability. To address scalability in particular, Datagen has been implemented on the MapReduce computation model to enable scaling out across a distributed cluster. However, since its inception in the early 2010s there has been a tremendous amount of development in the big data landscape, both in the sophistication of distributed processing platforms and in public cloud IaaS offerings. In the light of this, we should reevaluate this implementation, and in particular, investigate if Apache Spark would be a more cost-effective solution for generating datasets on the scale of tens of terabytes, on public clouds such as Amazon Web Services (AWS).</p> +<h2 id="overview">Overview</h2> +<p>The benchmark&rsquo;s specification describes a social network <a href="https://github.com/ldbc/ldbc_snb_docs/blob/9253abbde94ec7eaccd366c5d4c15cca30752e36/figures/schema-comfortable.pdf">data model</a> which divides its components into two broad categories: static and dynamic. The dynamic element consists of an evolving network where people make friends, post in forums, comment or like each other&rsquo;s posts, etc.
In contrast, the static component contains related attributes such as countries, universities and organizations and are fixed values. For the detailed specifications of the benchmark and the Datagen component, see <a href="#references">References</a>.</p> +<p>Datasets are generated in a multi-stage process captured as a sequence of MapReduce steps (shown in the diagram below).</p> +<p><img src="datagen_flow.png" alt=""> \ <em>Figure 1. LDBC SNB Datagen Process on Hadoop</em></p> +<p>In the initialization phase dictionaries are populated and distributions are initialized. In the first generation phase persons are synthesized, then relationships are wired between them along 3 dimensions (university, interest and random). After merging the graph of person relationships, the resulting dataset is output. Following this, activities such as forum posts, comments, likes and photos are generated and output. Finally, the static components are output.</p> +<p><em>Note: The diagram shows the call sequence as implemented. All steps are sequential &ndash; including the relationship generation &ndash;, even in cases when the data dependencies would allow for parallelization.</em></p> +<p>Entities are generated by procedural Java code and are represented as POJOs in memory and as sequence files on disk. Most entities follow a shallow representation, i.e foreign keys (in relational terms) are mapped to integer ids, which makes serialization straightforward.<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup> A notable exception is the Knows edge which contains only the target vertex, and is used as a navigation property on the source Person. The target Person is replaced with only the foreign key augmented with some additional information in order to keep the structure free of cycles. Needless to say, this <em>edge as property</em> representation makes the data harder to handle in SQL than it would be with a flat join table.</p> +<p>Entity generation amounts to roughly one fifth of the main codebase. It generates properties drawn from several random distributions using mutable pRNGs. Determinism is achieved by initializing the pRNGs to seeds that are fully defined by the configuration with constants, and otherwise having no external state in the logic.<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup></p> +<p>Serialization is done by hand-written serializers for the supported output formats (e.g. CSV) and comprises just a bit less than one third of the main codebase. Most of the output is created by directly interacting with low-level HDFS file streams. Ideally, this code should be migrated to higher-level writers that handle faults and give consistent results when the task has to be restarted.</p> +<h2 id="motivations-for-the-migration">Motivations for the migration</h2> +<p>The application is written using Hadoop MapReduce, which is now largely superseded by more modern distributed batch processing platforms, notably Apache Spark. For this reason, it was proposed to migrate Datagen to Spark. The migration provides the following benefits:</p> +<ul> +<li> +<p><strong>Better memory utilization:</strong> MapReduce is disk-oriented, i.e. it writes the output to disk after each reduce stage which is then read by the next MapReduce job. As public clouds provide virtual machines with sufficient RAM to encapsulate any generated dataset, time and money are wasted by the overhead this unnecessary disk I/O incurs. 
Instead, the intermediate results should be cached in memory where possible. The lack of support for this is a well-known limitation of MapReduce.</p> +</li> +<li> +<p><strong>Smaller codebase:</strong> The Hadoop MapReduce library is fairly ceremonial and boilerplatey. Spark provides a higher-level abstraction that is simpler to work with, while still providing enough control on the lower-level details required for this workload.</p> +</li> +<li> +<p><strong>Small entry cost:</strong> Spark and MapReduce are very close conceptually, they both utilise HDFS under the hood, and run on the JVM. This means that a large chunk of the existing code can be reused, and migration to Spark can, therefore, be completed with relatively small effort. Additionally, MapReduce and Spark jobs can be run on AWS EMR using basically the same HW/SW configuration, which facilitates straightforward performance comparisons.</p> +</li> +<li> +<p><strong>Incremental improvements:</strong> Spark exposes multiple APIs for different workloads and operating on different levels of abstraction. Datagen may initially utilise the lower-level, Java-oriented RDDs (which offer the clearest 1 to 1 mapping when coming from MapReduce) and gradually move towards DataFrames to support Parquet output in the serializers and maybe unlock some SQL optimization capabilities in the generators later down the road.</p> +</li> +<li> +<p><strong>OSS, commodity:</strong> Spark is one of the most widely used open-source big data platforms. Every major public cloud provides a managed offering for Spark. Together these mean that the migration increases the approachability and portability of the code.</p> +</li> +</ul> +<h2 id="first-steps">First steps</h2> +<p>The first milestone is a successful run of LDBC Datagen on Spark while making the minimum necessary amount of code alterations. This entails the migration of the Hadoop wrappers around the generators and serializers. The following bullet-points summarize the key notions that cropped up during the process.</p> +<ul> +<li> +<p><strong>Use your memory:</strong> A strong focus was placed on keeping the call sequence intact, so that the migrated code evaluates the same steps in the same order, but with data passed as RDDs. It was hypothesised that the required data could be either cached in memory entirely at all times, or if not, regenerating them would still be faster than involving the disk I/O loop (e.g. by using <code>MEMORY_AND_DISK</code>). In short, the default caching strategy was used everywhere.</p> +</li> +<li> +<p><strong>Regression tests:</strong> Lacking tests apart from an id uniqueness check, meant there were no means to detect bugs introduced by the migration. Designing and implementing a comprehensive test suite was out of scope, so instead, regression testing was utilised, with the MapReduce output as the baseline. The original output mostly consists of Hadoop sequence files which can be read into Spark, allowing comparisons to be drawn with the output from the RDD produced by the migrated code.</p> +</li> +<li> +<p><strong>Thread-safety concerns:</strong> Soon after migrating the first generator and running the regression tests, there were clear discrepancies in the output. These only surfaced when the parallelization level was set greater than 1. This indicated the presence of potential race conditions. 
Thread-safety wasn&rsquo;t a concern in the original implementation because MapReduce doesn&rsquo;t use thread-based parallelization for mappers and reducers.<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> In Spark, however, tasks are executed by parallel threads in the same JVM application, so the code is required to be thread-safe. After some debugging, a bug was discovered originating from the shared use of java.text.SimpleDateFormat (notoriously not thread-safe) in the serializers. This was resolved simply by changing to java.time.format.DateTimeFormatter. There were multiple instances of some static field on an object being mutated concurrently. In some cases this was a temporary buffer and was easily resolved by making it an instance variable. In another case a shared context variable was used, which was resolved by passing dedicated instances as function arguments. Sadly, the Java language has the same syntax for accessing locals, fields and statics,<sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup> which makes it somewhat harder to find potential unguarded shared variables.</p> +</li> +</ul> +<h2 id="case-study-person-ranking">Case study: Person ranking</h2> +<p>Migrating was rather straightforward; however, the so-called person ranking step required some thought. The goal of this step is to organize persons so that similar ones appear close to each other in a deterministic order. This provides a scalable way to cluster persons according to a similarity metric, as introduced in the <a href="#references">S3G2 paper [3]</a>.</p> +<h3 id="the-original-mapreduce-version">The original MapReduce version</h3> +<p><img src="person_ranking.svg" alt=""> \ <em>Figure 2. Diagram of the MapReduce code for ranking persons</em></p> +<p>The implementation, shown in pseudocode above, works as follows:</p> +<ol> +<li>The equivalence keys are mapped to each person and fed into a TotalOrderPartitioner, which maintains an order-sensitive partitioning while trying to emit more or less equally sized groups to keep the data skew low.</li> +<li>The reducer keys the partitions with its own task id and a counter variable, which is initialized to zero and incremented for each person, establishing a local ranking inside the group. The final state of the counter (which is the total number of persons in that group) is saved to a separate &ldquo;side-channel&rdquo; file upon the completion of a reduce task.</li> +<li>In a subsequent reduce-only stage, the global order is established by reading all of these previously emitted count files in the order of their partition number in each reducer, then creating an ordered map from each partition number to the corresponding cumulative count of persons found in all preceding ones. This is done in the setup phase. In the reduce function, the respective count is incremented and assigned to each person.</li> +</ol> +<p>Once this ranking is done, the whole range is sliced up into equally sized blocks, which are processed independently. For example, when wiring relationships between persons, only those appearing in the same block are considered.</p> +<h3 id="the-migrated-version">The migrated version</h3> +<p>Spark provides a sortBy function which takes care of the first step above in a single line. The gist of the problem remains collecting the partition sizes and making them available in a later step. While the MapReduce version uses a side output, in Spark the partition sizes are collected in a separate job and passed into the next phase using a broadcast variable. The resulting code size is a fraction of the original one.</p>
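+<p>A condensed sketch of this pattern is shown below. It is illustrative rather than the actual Datagen code: the function name and types are invented, and details such as tie-breaking and caching are omitted. The steps are: sort, count every partition in a separate job, turn the counts into cumulative offsets, broadcast them, and add the offset to a per-partition index.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">import scala.reflect.ClassTag
+import org.apache.spark.rdd.RDD
+
+// Illustrative only: assign a global, deterministic rank to every element of an RDD.
+def rankBy[P: ClassTag, K: Ordering: ClassTag](persons: RDD[P], key: P =&gt; K): RDD[(Long, P)] = {
+  val sorted = persons.sortBy(key) // establish a total order (range-partitioned)
+
+  // Separate job: count the elements of every partition.
+  val counts = sorted
+    .mapPartitionsWithIndex((i, it) =&gt; Iterator((i, it.size.toLong)))
+    .collect().sortBy(_._1).map(_._2)
+
+  // Cumulative offsets, shipped to the executors as a broadcast variable.
+  val offsets = sorted.sparkContext.broadcast(counts.scanLeft(0L)(_ + _))
+
+  // Local index within the partition + global offset = global rank.
+  sorted.mapPartitionsWithIndex((i, it) =&gt;
+    it.zipWithIndex.map { case (p, j) =&gt; (offsets.value(i) + j, p) })
+}
+</code></pre></div>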
+<h2 id="benchmarks">Benchmarks</h2> +<p>Benchmarks were carried out on AWS <a href="https://aws.amazon.com/emr/">EMR</a>, originally utilising <a href="https://aws.amazon.com/ec2/instance-types/i3/">i3.xlarge</a> instances because of their fast NVMe SSD storage and ample amount of RAM.</p> +<p>The application parameter hadoop.numThreads controls the number of reduce threads in each Hadoop job for the MapReduce version and the number of partitions in the serialization jobs in the Spark one. For MapReduce, this was set to n_nodes, i.e. the number of machines; experimentation yielded slowdowns for higher values. The Spark version, on the other hand, performed better with this parameter set to n_nodes * v_cpu. The scale factor (SF) parameter determines the output size. It is defined so that one SF unit generates around 1 GB of data. That is, SF10 generates around 10 GB, SF30 around 30 GB, etc. It should be noted, however, that incidentally the output was only 60% of this in these experiments, stemming from two reasons. One, update stream serialization was not migrated to Spark, due to problems in the original implementation. Of course, for the purpose of faithful comparison the corresponding code was removed from the MapReduce version as well before executing the benchmarks. This explains a 10% reduction from the expected size. The rest can be attributed to incorrectly tuned parameters.<sup id="fnref:5"><a href="#fn:5" class="footnote-ref" role="doc-noteref">5</a></sup> The MapReduce results were as follows:</p> +<table> +<thead> +<tr> +<th>SF</th> +<th>workers</th> +<th>Platform</th> +<th>Instance Type</th> +<th>runtime (min)</th> +<th>runtime * worker/SF (min)</th> +</tr> +</thead> +<tbody> +<tr> +<td>10</td> +<td>1</td> +<td>MapReduce</td> +<td>i3.xlarge</td> +<td>16</td> +<td>1.60</td> +</tr> +<tr> +<td>30</td> +<td>1</td> +<td>MapReduce</td> +<td>i3.xlarge</td> +<td>34</td> +<td>1.13</td> +</tr> +<tr> +<td>100</td> +<td>3</td> +<td>MapReduce</td> +<td>i3.xlarge</td> +<td>40</td> +<td>1.20</td> +</tr> +<tr> +<td>300</td> +<td>9</td> +<td>MapReduce</td> +<td>i3.xlarge</td> +<td>44</td> +<td>1.32</td> +</tr> +</tbody> +</table> +<p>It can be observed that the runtime per scale factor only increases slowly, which is good. The metric charts show an underutilized, bursty CPU. The bursts are supposedly interrupted by the disk I/O parts when the node is writing the results of a completed job. It can also be seen that the memory only starts to get consumed after 10 minutes of the run have passed.</p> +<p><img src="mr_sf100_cpu_load.png" alt=""> <br> +<em>Figure 3. CPU Load for the MapReduce cluster is bursty and less than<br> +50% on average (SF100, 2nd graph shows master)</em></p> +<p><img src="mr_sf100_mem_free.png" alt=""> <br> +<em>Figure 4.
The job only starts to consume memory when already 10 minutes<br> +into the run (SF100, 2nd graph shows master)</em></p> +<p>Let&rsquo;s see how Spark fares.</p> +<table> +<thead> +<tr> +<th>SF</th> +<th>workers</th> +<th>Platform</th> +<th>Instance Type</th> +<th>runtime (min)</th> +<th>runtime * worker/SF (min)</th> +</tr> +</thead> +<tbody> +<tr> +<td>10</td> +<td>1</td> +<td>Spark</td> +<td>i3.xlarge</td> +<td>10</td> +<td>1.00</td> +</tr> +<tr> +<td>30</td> +<td>1</td> +<td>Spark</td> +<td>i3.xlarge</td> +<td>21</td> +<td>0.70</td> +</tr> +<tr> +<td>100</td> +<td>3</td> +<td>Spark</td> +<td>i3.xlarge</td> +<td>27</td> +<td>0.81</td> +</tr> +<tr> +<td>300</td> +<td>9</td> +<td>Spark</td> +<td>i3.xlarge</td> +<td>36</td> +<td>1.08</td> +</tr> +<tr> +<td>1000</td> +<td>30</td> +<td>Spark</td> +<td>i3.xlarge</td> +<td>47</td> +<td>1.41</td> +</tr> +<tr> +<td>3000</td> +<td>90</td> +<td>Spark</td> +<td>i3.xlarge</td> +<td>47</td> +<td>1.41</td> +</tr> +</tbody> +</table> +<p>A similar trend holds here; however, the run times are around 70% of the MapReduce version&rsquo;s. It can be seen that the larger scale factors (SF1000 and SF3000) yielded longer runtimes than expected. On the metric charts of SF100 the CPU shows full utilization, except at the end, when the results are serialized in one go and the CPU is basically idle (the snapshot of the diagram doesn&rsquo;t include this part unfortunately). Spark can be seen to have used up all memory pretty fast even in the case of SF100. In the case of SF1000 and SF3000, the nodes are running so low on memory that most probably some of the RDDs have to be calculated multiple times (no disk-level serialization was used here), which seems to be the most plausible explanation for the slowdowns experienced. In fact, the OOM errors encountered when running SF3000 support this hypothesis even further. It was thus proposed to scale up the RAM in the instances. The CPU utilization hints that adding some extra vCPUs as well can yield further speedup.</p> +<p><img src="spark_sf100_cpu_load.png" alt=""> <br> +<em>Figure 5. Full CPU utilization for Spark (SF100, last graph shows<br> +master)</em></p> +<p><img src="spark_sf100_mem_free.png" alt=""> <br> +<em>Figure 6. Spark eats up memory fast (SF100, 2nd graph shows master)</em></p> +<p>i3.2xlarge would have been the most straightforward option for scaling up the instances; however, the humongous 1.9 TB disk of this instance type is completely unnecessary for the job.
Instead the cheaper r5d.2xlarge instance was utilised, largely identical to i3.2xlarge, except it <em>only</em> has a 300 GB SSD.</p> +<table> +<thead> +<tr> +<th>SF</th> +<th>workers</th> +<th>Platform</th> +<th>Instance Type</th> +<th>runtime (min)</th> +<th>runtime * worker/SF (min)</th> +</tr> +</thead> +<tbody> +<tr> +<td>100</td> +<td>3</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>16</td> +<td>0.48</td> +</tr> +<tr> +<td>300</td> +<td>9</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>21</td> +<td>0.63</td> +</tr> +<tr> +<td>1000</td> +<td>30</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>26</td> +<td>0.78</td> +</tr> +<tr> +<td>3000</td> +<td>90</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>25</td> +<td>0.75</td> +</tr> +<tr> +<td>10000</td> +<td>303</td> +<td>Spark</td> +<td>r5d.2xlarge</td> +<td>25</td> +<td>0.75</td> +</tr> +</tbody> +</table> +<p>The last column clearly demonstrates our ability to keep the cost per scale factor unit constant.</p> +<h2 id="next-steps">Next steps</h2> +<p>The next improvement is refactoring the serializers so they use Spark&rsquo;s high-level writer facilities. The most compelling benefit is that it will make the jobs fault-tolerant, as Spark maintains the integrity of the output files in case the task that writes it fails. This makes Datagen more resilient and opens up the possibility to run on less reliable hardware configuration (e.g. EC2 spot nodes on AWS) for additional cost savings. They will supposedly also yield some speedup on the same cluster configuration.</p> +<p>As already mentioned, the migration of the update stream serialization was ignored due to problems with the original code. Ideally, they should be implemented with the new serializers.</p> +<p>The Spark migration also serves as an important building block for the next generation of LDBC benchmarks. As part of extending the SNB benchmark suite, the SNB task force has recently extended Datagen with support for <a href="#references">generating delete operations [1]</a>. The next step for the task force is to fine-tune the temporal distributions of these deletion operations to ensure that the emerging sequence of events is realistic, i.e. the emerging distribution resembles what a database system would experience when serving a real social network.</p> +<h2 id="acknowledgements">Acknowledgements</h2> +<p>This work is based upon the work of Arnau Prat, Gábor Szárnyas, Ben Steer, Jack Waudby and other LDBC contributors. 
Thanks for your help and feedback!</p> +<h2 id="references">References</h2> +<p>[1] <a href="https://ldbcouncil.org/docs/papers/datagen-deletes-grades-nda-2020.pdf">Supporting Dynamic Graphs and Temporal Entity Deletions in the LDBC Social Network Benchmark&rsquo;s Data Generator</a></p> +<p>[2] <a href="https://www.youtube.com/watch?v=ZQOLuCOOpSI">9th TUC Meeting &ndash; LDBC SNB Datagen Update &ndash; Arnau Prat (UPC)</a> - <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">slides</a></p> +<p>[3] <a href="https://research.vu.nl/en/publications/s3g2-a-scalable-structure-correlated-social-graph-generator">S3G2: a Scalable Structure-correlated Social Graph Generator</a></p> +<p>[4] <a href="https://arxiv.org/abs/2001.02299">The LDBC Social Network Benchmark</a></p> +<p>[5] <a href="https://ldbcouncil.org/">LDBC</a> - <a href="https://github.com/ldbc">LDBC GitHub organization</a></p> +<div class="footnotes" role="doc-endnotes"> +<hr> +<ol> +<li id="fn:1"> +<p>Also makes it easier to map to a tabular format thus it is a SQL friendly representation.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:2"> +<p>It&rsquo;s hard to imagine this done declaratively in SQL.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:3"> +<p>Instead, multiple YARN containers have to be used if you want to parallelize on the same machine.&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:4"> +<p>Although editors usually render these using different font styles.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:5"> +<p>With the addition of deletes, entities often get inserted and deleted during the simulation (which is normal in a social network). During serialization, we check for such entities and omit them. However, we forgot to calculate this when determining the output size, which we will amend when tuning the distributions.&#160;<a href="#fnref:5" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +</ol> +</div> + + + + + Twelfth TUC Meeting + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + Fri, 05 Jul 2019 08:30:00 +0100 + + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + <p>LDBC is pleased to announce its Twelfth Technical User Community (TUC) meeting.</p> +<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event on the last Friday of <strong><a href="https://sigmod2019.org/">SIGMOD/PODS 2019</a></strong> in Amsterdam, The Netherlands, in the conference venue of <strong><a href="http://sigmod2019.org/conf_venue">Beurs van Berlage</a></strong>. The room is the Mendes da Silva kamer. 
Please check its tips for <strong><a href="http://sigmod2019.org/accommodation">accommodation in Amsterdam</a></strong>.</p> +<p>Note also that at SIGMOD/PODS in Amsterdam on Sunday, June 30, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2019">GRADES-NDA 2019</a>, that may be of interest to our audience (this generally holds for the whole SIGMOD/PODS program, of course).</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>You need to be registered in order to get into the SIGMOD/PODS venue. Friday, July 5, is the final, workshop, day of SIGMOD/PODS, and the LDBC TUC meeting joins the other workshops for coffee and lunch.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management.</p> +<p><strong>Talk proposals can be sent to Peter Boncz</strong>, who is also the local organizer. <strong>Please also send your slides to this email for archiving on this site.</strong></p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting, there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The morning slot (08:30-10:30) is reserved for an LDBC Board Meeting, to which in principle only LDBC directors are invited (that meeting will be held in the same room).</p> +<p>The TUC meeting will start on Friday morning after the morning coffee break of SIGMOD/PODS 2019 (<strong>room: Mendes da Silva kamer</strong>):</p> +<p>08:30-10:30 LDBC Board Meeting (non-public)</p> +<p>10:30-11:00 Coffee</p> +<p>11:00-12:45 Session 1: Graph Benchmarks</p> +<ul> +<li> +<p>11:00-11:05 Welcome &amp; introduction</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230404.pdf">11:05-11:45 Gabor Szarnyas (BME), Benjamin Steer (QMUL), Jack Waudby (Newcastle University): Business Intelligence workload: Progress report and roadmap</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706117.pdf">11:45-12:00 Frank McSherry (Materialize): Experiences implementing LDBC queries in a dataflow system</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706118.pdf">12:00-12:25 Vasileios Trigonakis (Oracle): Evaluating a new distributed graph query engine with LDBC: Experiences and limitations</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706130.pdf">12:25-12:45 Ahmed Musaafir (VU Amsterdam): LDBC Graphalytics</a></p> +</li> +</ul> +<p>12:45-14:00 Lunch</p> +<p>14:00-16:05 Session 2: Graph Query Languages</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706120.pdf">14:00-14:25 Juan Sequeda (Capsenta): Property Graph Schema Working Group: A progress report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706121.pdf">14:25-14:50 Stefan Plantikow (Neo4j): GQL: Scope and features</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706122.pdf">report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706119.pdf">14:50-15:15 Vasileios Trigonakis (Oracle): Property graph extensions for the SQL standard</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706129.pdf">15:15-15:40 Alin Deutsch (TigerGraph): Modern graph analytics support in GSQL, TigerGraph&rsquo;s query language</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230401.pdf">15:40-16:05 Jan Posiadała (Nodes and Edges, Poland): Executable semantics of graph query language</a></p> +</li> +</ul> +<p>16:05-16:30 Coffee</p> 
+<p>16:30-17:50 Session 3: Graph System Performance</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111968258.pdf">16:30-16:50 Per Fuchs (CWI): Fast, scalable WCOJ graph-pattern matching on in-memory graphs in Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706124.pdf">16:50-17:10 Semih Salihoglu (University of Waterloo): Optimizing subgraph queries with a mix of tradition and modernity</a> <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706116.pptx">pptx</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706128.pdf">17:10-17:30 Roi Lipman (RedisGraph): Evaluating Cypher queries and procedures as algebraic operations within RedisGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706133.pdf">17:30-17:50 Alexandru Uta (VU Amsterdam): Low-latency Spark queries on updatable data</a></p> +</li> +</ul> +<p>If there is interest, we will organize a social dinner on Friday evening for LDBC attendees.</p> + + + + + Eleventh TUC Meeting + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + Fri, 08 Jun 2018 08:30:00 -0500 + + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + <p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmark development, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event preceding the <a href="https://sigmod2018.org/">SIGMOD/PODS 2018</a> conference in Houston, Texas (not too far away, the whole next week). Note also that at SIGMOD/PODS in Houston on Sunday 10, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2018/">GRADES-NDA 2018</a> as well, so you might combine travel.</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz (<a href="mailto:boncz@cwi.nl">boncz@cwi.nl</a>) and Larri (<a href="mailto:larri@ac.upc.ed">larri@ac.upc.edu</a>). 
Local organizer is Juan Sequeda (<a href="mailto:juanfederico@gmail.com">juanfederico@gmail.com</a>).</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its interactive, business analytics and graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00:</p> +<ul> +<li> +<p>10:30-10:35 Peter Boncz (CWI) - introduction to the LDBC TUC meeting</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090478.pdf">10:35-11:00 Juan Sequeda (Capsenta) - Announcing: gra.fo</a></p> +</li> +<li> +<p>11:00-11:30 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090466.pdf">11:30-11:55 Gabor Szarnyas (BME) - LDBC benchmarks: three aspects of graph processing</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090463.pdf">11:55-12:20 Peter Boncz (CWI) - G-CORE: a composable graph query language by LDBC</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090472.pdf">12:20-12:45 Yinglong Xia (Huawei) - Graph Engine for Cloud AI</a></p> +</li> +<li> +<p>12:45-14:00 lunch</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090474.pdf">14:00-14:25 Stefan Plantikow (Neo4j) - Composable Graph Queries and Multiple Named Graphs in Cypher for Apache Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090481.pdf">14:25-14:50 Oskar van Rest (Oracle) - Analyzing Stack Exchange data using Property Graph in Oracle</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090485.pdf">14:50-15:15 Brad Bebee (Amazon) - Neptune: the AWS graph management service</a></p> +</li> +<li> +<p>15:15-15:40 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99811329.pdf">15:40-16:05 Bryon Jacob (data.world): Broadening the Semantic Web</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99287041.pdf">16:05-16:30 Jason Plurad (IBM) - Graph Computing with JanusGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99745793.pdf">16:30-16:55 Arthur Keen (Cambridge Semantics): AnzoGraph</a></p> +</li> +<li> +<p><a href="http://relational.ai/">16:55-17:20 Molham Aref (relational.ai)</a>) - Introducing.. 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99418113.pdf">relational.ai</a></p> +</li> +<li> +<p>18:00 - 20:00 social dinner in Austin (sponsored by Intel Corp.), Coopers BBQ, 217 Congress Ave, Austin, TX 78701</p> +</li> +</ul> +<h3 id="location">Location</h3> +<p>The TUC will be held at the <a href="https://www.cs.utexas.edu/">University of Texas at Austin, Department of Computer Science</a> in the <a href="https://www.google.com/maps/place/The+University+of+Texas:+Department+of+Computer+Science/@30.2860955,-97.737582,18z/data=!4m5!3m4!1s0x0:0x12edecc8226b3241!8m2!3d30.2862279!4d-97.7365348">Gates Dell Complex (GDC): 2317 Speedway, Austin TX, 78712</a> Room: GDC 6.302</p> +<p>The GDC building has a North and a South building. GDC 6.302 is in the North building. When you enter the main entrance, the North building is on the left and it is served by a pair of elevators. You can take or the elevator to the 6th floor. Exit the elevator on the 6th floor. Turn left, right, left.</p> +<h3 id="from-austin-to-sigmodpods-houston-on-saturday-june-9">From Austin to SIGMOD/PODS (Houston) on Saturday June 9</h3> +<p>Many of the attendees will be going to SIGMOD/PODS which will be held in Houston.</p> +<h4 id="bus">Bus</h4> +<p>One option is to take a <a href="https://us.megabus.com/journey-planner/journeys?days=1&amp;concessionCount=0&amp;departureDate=2018-06-09&amp;destinationId=318&amp;inboundOtherDisabilityCount=0&amp;inboundPcaCount=0&amp;inboundWheelchairSeated=0&amp;nusCount=0&amp;originId=320&amp;otherDisabilityCount=0&amp;pcaCount=0&amp;totalPassengers=1&amp;wheelchairSeated=0">MegaBus that departs from downtown Austin and arrives at downtown Houston</a>.</p> +<p>There is a bus that departs at 12:00PM and arrives at 3:00pm. Cost is $20 (as of April 23).</p> +<p>If you want to spend the day in Austin, there is a bus that departs at 9:55PM and arrives at 12:50am. Cost is $5 (as of April 23).</p> + + + + + Tenth TUC Meeting + https://ldbcouncil.org/event/tenth-tuc-meeting/ + Fri, 01 Sep 2017 10:30:00 +0100 + + https://ldbcouncil.org/event/tenth-tuc-meeting/ + <p>This will be a one-day event at the <a href="http://www.vldb.org/2017">VLDB 2017</a> conference in Munich, Germany on September 1, 2017.</p> +<p>Topics and activities of interest in these TUC meetings are:</p> +<ul> +<li>Presentation on graph data management usage scenarios.</li> +<li>Presentation of the benchmarking results for the different benchmarks, as well as the graph query language task force.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Adrian Diaz (UPC) at <a href="mailto:adiaz@ac.upc.edu">adiaz@ac.upc.edu</a> to register; registration is free, but required.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. 
Talk proposals are handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00</p> +<p>10:30-12:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87588865.pdf">Peter Boncz (CWI): GraphQL task force update - the G-CORE proposal</a> (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868018.pptx">pptx</a>)</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868008.pdf">Gabor Szarnyas (Budapest University of Technology and Economics Hungarian Academy of Sciences): Updates on the Social Network Benchmark BI Workload</a></li> +<li>Alexandru Iosup, Wing Lung Ngai (VU/TU Delft): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868014.pdf">LDBC Graphalytics v0.9</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868013.pdf">Graphalytics Global Competition and Graphalytics Custom Benchmark</a></li> +</ul> +<p>12:00-13:30: lunch break</p> +<p>13:30-15:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868024.pdf">Arnau Prat (UPC): Datasynth: Democratizing property graph generation</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868026.pdf">Marcus Paradies (SAP): SAP HANA GraphScript</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031809.pdf">Yinglong Xia (Huawei): The EYWA Graph Engine in a Cloud AI Platform</a></li> +<li>Gaétan Hains (Huawei): Cost semantics for graph queries</li> +</ul> +<p>15:00-15:30: break</p> +<p>15:30-17:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031812.pdf">Petra Selmer and Stefan Plantikow (Neo4j): openCypher Developments in 2017</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87195650.pdf">Markus Kaindl (Springer): SN SciGraph &ndash; Building a Linked Data Knowledge Graph for the Scholarly Publishing Domain</a></li> +<li>Irini Fundulaki (FORTH): The HOBBIT Link Discovery and Versioning Benchmarks</li> +<li>Ghislain Atemezing (Mondeca): Benchmarking Enterprise RDF stores with Publications Office Dataset</li> +</ul> +<p>Speakers should aim for a <strong>20-minute talk</strong>.</p> +<p>Further:</p> +<ul> +<li>on Friday 
evening (19:00-21:00) there will be a <strong>social dinner</strong> at <a href="https://www.loewenbraeukeller.com/en/pub-and-beer-garden/">Löwenbräukeller</a>, sponsored and arranged by LDBC member Huawei (who have their European Research Center in Munich).</li> +<li>on Friday morning (8:30-10:30) there will be a meeting of the LDBC board of directors, but this meeting is not public.</li> +</ul> +<h3 id="venue">Venue</h3> +<p>The Technical University of Munich (TUM) is hosting that week the <a href="http://www.vldb.org/2017">VLDB conference</a>; on the day of the TUC meeting the main conference will have finished, but there will be a number of co-located workshops ongoing, and the TUC participants will blend in with that crowd for the breaks and lunch.</p> +<p>The TUC meeting will be held in in <strong>Room 2607</strong> alongside the VLDB workshops that day (MATES, ADMS, DMAH, DBPL and BOSS).</p> +<p><strong>address: Technische Universität München (TUM), Arcisstraße 21, 80333 München</strong></p> +<p><a href="https://www.google.nl/maps/place/Technische+Universit%C3%A4t+M%C3%BCnchen/@48.14966,11.5656715,17z/data=!3m1!4b1!4m5!3m4!1s0x479e7261336d8c11:0x79a04d44dc5bf19d!8m2!3d48.14966!4d11.5678602?hl=en">Google Maps</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920002.jpg" alt=""><br> +<img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920003.jpg" alt=""></p> + + + + + Ninth TUC Meeting + https://ldbcouncil.org/event/ninth-tuc-meeting/ + Thu, 09 Feb 2017 15:07:18 -0400 + + https://ldbcouncil.org/event/ninth-tuc-meeting/ + <p>LDBC is pleased to announce its Ninth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> in Walldorf, Germany on February 9+10, 2017.</p> +<p>This will be the third TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>;</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of TUC meeting participants and graph technology user contacts, and eventually its membership base.</p>
+<h3 id="agenda">Agenda</h3>
+<p>In the TUC meeting there will be:</p>
+<ul>
+<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li>
+<li>talks by data management practitioners highlighting graph data management challenges</li>
+<li>selected scientific talks on graph data management technology</li>
+</ul>
+<p>The meeting will start on Thursday morning, with a program from 09:00-18:00, interrupted by a lunch break.</p>
+<p>Thursday evening (19:00-21:00) there will be a <strong>social dinner</strong> in Heidelberg.</p>
+<p>Friday morning the event resumes from 9:00-12:00. In the afternoon, there is a (closed) LDBC Board of Directors meeting (13:00-16:30) at the same venue.</p>
+<h4 id="social-dinner">Social Dinner</h4>
+<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235334.png" alt=""></p>
+<p><strong>Address: Hauptstraße 217, 69117 Heidelberg</strong><br>
+<strong>Time: 19:00 / 7pm</strong></p>
+<p>(See attachments at the bottom of the page)</p>
+<h5 id="thursday">Thursday</h5>
+<table>
+<thead>
+<tr>
+<th>start time</th>
+<th>title – speaker</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>9:00</td>
+<td>Welcome and logistics - Marcus Paradies (SAP)</td>
+</tr>
+<tr>
+<td>9:10</td>
+<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235329.pdf">Intro + state of the LDBC - Josep Lluis Larriba Pey</a> (UPC)</td>
+</tr>
+<tr>
+<td>9:20</td>
+<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235338.pdf">LDBC Graph QL task force</a> - Hannes Voigt (TU Dresden)</td>
+</tr>
+<tr>
+<td>9:40</td>
+<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235335.pdf">PGQL Status Update and Comparison to LDBC&rsquo;s Graph QL proposals</a> - Oskar van Rest (Oracle Labs)</td>
+</tr>
+<tr>
+<td>10:00</td>
+<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628546.pdf">Adding shortest-paths to MonetDB</a> - Dean de Leo (CWI)</td>
+</tr>
+<tr>
+<td>10:20</td>
+<td>coffee</td>
+</tr>
+<tr>
+<td>10:50</td>
+<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431939.pdf">Evolving Cypher for processing multiple graphs</a> - Stefan Plantikow (Neo Technology)</td>
+</tr>
+<tr>
+<td>11:10</td>
+<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235346.pdf">Standardizing Graph Database Functionality - An Invitation to Collaborate</a> - Jan Michels (ISO/ANSI SQL, Oracle)</td>
+</tr>
+<tr>
+<td>11:30</td>
+<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235343.pdf">Dgraph: Graph database for production environment</a> - Tomasz Zdybal (Dgraph.io)</td>
+</tr>
+<tr>
+<td>12:00</td>
+<td>lunch</td>
+</tr>
+<tr>
+<td>13:00</td>
+<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431945.pdf">LDBC Graphalytics: Current Capabilities, Upcoming Features, and Long-Term Roadmap</a> - Alexandru Iosup (TU Delft)</td>
+</tr>
+<tr> +<td>13:20</td> +<td>LDBC Graphalytics: Demo of the Live Archive and Competition Features - Tim Hegeman (TU Delft)</td> +</tr> +<tr> +<td>13:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">LDBC SNB Datagen Update</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431943.pdf">LDBC SNB Business Intelligence Workload: Chokepoint Analysis</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431947.pdf">LDBC Benchmark Cost Specification</a> (+discussion) - Moritz Kaufmann (TU Munich)</td> +</tr> +<tr> +<td>14:40</td> +<td>coffee break</td> +</tr> +<tr> +<td>15:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76316673.pdf">EYWA: the Distributed Graph Engine in Huawei MIND Platform</a> (Yinglong Xia)</td> +</tr> +<tr> +<td>15:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431949.pdf">Graph Processing in SAP HANA</a> - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>15:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628563.pdf">Distributed Graph Analytics with Gradoop</a> - Martin Junghanns (Univ Leipzig)</td> +</tr> +<tr> +<td>16:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152834.pdf">Distributed graph flows: Cypher on Flink and Gradoop</a> - Max Kießling (Neo Technology)</td> +</tr> +<tr> +<td>16:30</td> +<td>closing - Peter Boncz</td> +</tr> +<tr> +<td>17:30</td> +<td>end</td> +</tr> +</tbody> +</table> +<h5 id="friday">Friday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>welcome - Peter Boncz</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152833.pdf">Graph processing in obi4wan</a> - Frank Smit (OBI4WAN)</td> +</tr> +<tr> +<td>9:40</td> +<td>Graph problems in the space domain - Albrecht Schmidt (ESA)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75792387.pdf">Medical Ontologies for Healthcare</a> - Michael Neumann (SAP)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76447745.pdf">The Train Benchmark: Cross-Technology Performance Evaluation of Continuous Model Queries</a> - Gabor Szarnyas (BME)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76021761.pdf">Efficient sparse matrix computations and their generalization to graph computing applications</a> - Albert-Jan Yzelman (Huawei)</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152837.pdf">Experiments on Semantic Publishing Benchmark with large scale real news and LOD data at FactForge</a> - Atanas Kyriakov (Ontotext)</td> +</tr> 
+<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td>LDBC Board of Directors Meeting</td> +</tr> +<tr> +<td>17:00</td> +<td>end</td> +</tr> +</tbody> +</table> +<h3 id="logistics">Logistics</h3> +<h5 id="important-things-to-know"><strong>Important things to know</strong></h5> +<p>The following PDF guide provides additional information, such as recommended restaurants as well as sightseeing spots: <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">link</a></p> +<h5 id="venue"><strong>Venue</strong></h5> +<p>The TUC meeting will be held in the <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> at the SAP Guesthouse Kalipeh (<a href="https://www.kalipeh.com">https://www.kalipeh.com</a>). The address is:</p> +<p><strong>WDF 44 / SAP Guesthouse Kalipeh<br> +Dietmar-Hopp-Allee 15<br> +69190 Walldorf<br> +Germany</strong></p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p><a href="https://www.google.com/maps/place/SAP+Guesthouse+Kalipeh/@49.2951903,8.6436224,17z/data=!3m1!4b1!4m5!3m4!1s0x4797bea343a566af:0xd70698f3503ab74b!8m2!3d49.2951868!4d8.6458111">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/69042180.png" alt=""></p> +<h4 id="getting-there"><strong>Getting there</strong></h4> +<h5 id="by-plane"><strong>By plane</strong></h5> +<p>There are two airports close to SAP&rsquo;s headquarter: Frankfurt Airport (FRA) and Stuttgart-Echterdingen Airport (STR). The journey from Frankfurt Airport to SAP headquarters takes about one hour by car, while it takes slightly longer from Stuttgart- Echterdingen Airport. Concerning airfare, flights to Frankfurt are usually somewhat more expensive than to Stuttgart.</p> +<p>When booking flights to Frankfurt, you should be aware of Frankfurt-Hahn Airport (HHN), which serves low-cost carriers but is not connected to Frankfurt Airport. Frankfurt Hahn is approximately one hour from the Frankfurt main airport by car.</p> +<p>The journey from Frankfurt Airport to SAP headquarters takes about one hour by car (95 kilometers, or 59 miles).</p> +<p>Journey time from Stuttgart-Echterdingen Airport to SAP headquarters takes about 1 hour and 15 minutes by car (115 kilometers, or 71 miles).</p> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<p><strong>Traveling from Frankfurt Airport (FRA) to SAP Headquarters:</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A3/Würzburg/A5/Kassel/Basel/Frankfurt.&rdquo;</li> +<li>Follow the A5 to &ldquo;Basel/Karlsruhe/Heidelberg.&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<p>(Should you use a navigational system which does not recognize the street name &lsquo;Dietmar-Hopp-Allee&rsquo; please use &lsquo;Neurottstrasse&rsquo; instead.)</p> +<p><strong>Traveling from Stuttgart-Echterdingen Airport (STR) to SAP Headquarters:</strong></p> +<p>To get to SAP headquarters by car, there are two possible routes to take. The first leads you via Heilbronn and the second via Karlsruhe. 
The route via Karlsruhe is a bit shorter yet may be more congested.</p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A8/Stuttgart/B27.&rdquo;</li> +<li>Stay on A8 and follow the sign for &ldquo;Karlsruhe/Heilbronn/Singen/A8.&rdquo;</li> +<li>Follow A8 to Karlsruhe.</li> +<li>Take exit 41 &ndash; &ldquo;Dreieck Karlsruhe&rdquo; to merge onto A5 toward &ldquo;Frankfurt/Mannheim/Karlsruhe/Landau (Pfalz).&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<h6 id="parking"><strong>Parking</strong></h6> +<p>The closest parking lot to the event location is P7 (see figure above).</p> +<h5 id="by-train"><strong>By Train</strong></h5> +<p>As the infrastructure is very well developed in Europe, and in Germany in particular, taking the train is a great and easy way of traveling. Furthermore, the trains usually run on time, so this mode of travel is very convenient, especially for a group of people on longer journeys to major cities.</p> +<p><strong>From Frankfurt Airport (FRA) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to Terminal 1, level T (see overview in Appendix).</li> +<li>Go to the AIRail Terminal &ndash; &ldquo;Fernbahnhof&rdquo; (long-distance trains).</li> +<li>Choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP.&rdquo; It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> +<p><strong>From Stuttgart-Echterdingen Airport (STR) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to the S-Bahn station in the airport, following the sign (station is called &ldquo;Stuttgart Flughafen/Messe&rdquo;).</li> +<li>Take train number S2 or S3 to &ldquo;Stuttgart Hauptbahnhof&rdquo; (main station).</li> +<li>From Stuttgart Hauptbahnhof choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP&rdquo;. It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> + + + + + LDBC Is Proud to Announce the New LDBC Graphalytics Benchmark Draft Specification + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + Tue, 06 Sep 2016 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + <p>LDBC is proud to announce the new LDBC Graphalytics Benchmark draft specification.</p> +<p>LDBC Graphalytics is the first industry-grade graph data management benchmark for graph analysis platforms such as Giraph. It consists of six core algorithms, standard datasets, synthetic dataset generators, and reference outputs, enabling the objective comparison of graph analysis platforms. 
It has strong industry support from Oracle, Intel, Huawei and IBM, and was tested and optimized on the best industrial and open-source systems.</p>
+<p>Tim Hegeman of <a href="https://www.tudelft.nl">TU Delft</a> is presenting the technical paper describing LDBC Graphalytics today at the <a href="https://www.vldb.org/conference.html">VLDB</a> (Very Large DataBases) conference in New Delhi, where his talk also marks the release by LDBC of Graphalytics as a benchmark draft. Practitioners are invited to read the PVLDB paper, download the software and try running it.</p>
+<p>LDBC is eager to use any feedback for the future adoption of LDBC Graphalytics.</p>
+<p>Learn more: <a href="/ldbc-graphalytics">LDBC Graphalytics</a></p>
+<p>GitHub: <a href="https://github.com/tudelft-atlarge/graphalytics">https://github.com/tudelft-atlarge/graphalytics</a></p> + + + + + Eighth TUC Meeting + https://ldbcouncil.org/event/eighth-tuc-meeting/ + Wed, 22 Jun 2016 14:45:20 -0400 + + https://ldbcouncil.org/event/eighth-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Eighth Technical User Community (TUC) meeting.</p>
+<p>This will be a two-day event at the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a> in Redwood Shores on <strong>Wednesday and Thursday, June 22-23, 2016</strong>.</p>
+<p>This will be the second TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will cover the following aspects:</p>
+<ul>
+<li>Two-day event with one day devoted to users&rsquo; experiences and one day devoted to benchmarking experiences.</li>
+<li>Presentation of the benchmarking results for the different benchmarks.</li>
+<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li>
+</ul>
+<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify Oracle security in advance, registration requests need to be in by <strong>June 12</strong>.</p>
+<p>In the agenda, there will be talks by LDBC members on LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and in hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p>
+<p>Further, if you or your colleagues have contacts at companies that deal with graph data management scenarios, we encourage you to invite them to attend and possibly present. 
LDBC is always looking to expand its circle of TUC meeting participants and graph technology user contacts, and eventually its membership base.</p>
+<p>On this page, you&rsquo;ll find information about the following items:</p>
+<ul>
+<li><a href="#agenda">Agenda</a></li>
+<li><a href="#logistics">Logistics</a>
+<ul>
+<li><a href="#date">Date</a></li>
+<li><a href="#venue">Venue</a></li>
+<li><a href="#getting-there">Getting there</a></li>
+</ul>
+</li>
+<li><a href="#accommodation">Accommodation</a></li>
+</ul>
+<h3 id="agenda">Agenda</h3>
+<p>On Wednesday, lunch is provided for all attendees at 12 pm. The TUC meeting will start at 1 pm.</p>
+<h6 id="wednesday-22th-of-june-2016-room-203"><strong>Wednesday, 22nd of June 2016 (Room 203)</strong></h6>
+<p>(full morning: LDBC Board of Directors meeting)</p>
+<ul>
+<li>12:00 - 13:00 Lunch (provided)</li>
+<li>13:00 - 13:30 Hassan Chafi (Oracle) and Josep L. Larriba-Pey (Sparsity): Registration and welcome.</li>
+<li>13:30 - 14:00 Peter Boncz (CWI) <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133891.pdf">LDBC introduction and status update</a>.</li>
+<li>14:00 - 15:00 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</li>
+<li>14:00 Arnau Prat (DAMA-UPC). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133902.pdf">Social Network Benchmark, Interactive workload</a>.</li>
+<li>14:30 Tim Hegeman (TU Delft). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133893.pdf">Social Network Benchmark, Analytics workload</a>.</li>
+<li>15:00 - 15:30 Coffee break</li>
+<li>15:30 - 17:00 Applications and use of Graph Technologies (chair Hassan Chafi)
+<ul>
+<li>15:30 Martin Zand (University of Rochester Clinical and Translational Science Institute). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133897.pdf">Graphing Healthcare Networks: Data, Analytics, and Use Cases.</a></li>
+<li>16:00 David Meibusch, Nathan Hawes (Oracle Labs Australia). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133901.pdf">Frappé: Querying and managing evolving code dependency graphs</a>.</li>
+<li>16:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133895.pdf">UniProt: challenges of a public SPARQL endpoint.</a></li>
+</ul>
+</li>
+<li>17:00 - 18:30 Graph Technologies (chair Peter Boncz)
+<ul>
+<li>17:00 Eugene I. Chong (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133904.pdf">Balancing Act to improve RDF Query Performance in Oracle Database</a>.</li>
+<li>17:30 Lijun Chang (University of New South Wales). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133906.pdf">Efficient Subgraph Matching by Postponing Cartesian Products</a>.</li>
+<li>18:00 Weining Qian (East China Normal University). 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133908.pdf">On Statistical Characteristics of Real-Life Knowledge Graphs</a>.</li> +</ul> +</li> +</ul> +<h6 id="thursday-23th-of-june-2016-room-203"><strong>Thursday, 23th of June 2016 (Room 203)</strong></h6> +<ul> +<li>08:00 - 09:00 Breakfast (provided)</li> +<li>09:00 - 10:00 Details on the progress of LDBC Task Forces 2 (chair Josep L. Larriba-Pey) +<ul> +<li>09:00 Peter Boncz (CWI). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133896.pdf">Query Language Task Force status</a></li> +<li>09:45 Marcus Paradies (SAP). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297729.pdf">Social Network Benchmark, Business Intelligence workload</a></li> +</ul> +</li> +<li>10:00 - 12:00 Graph Technologies and Benchmarking (chair Oskar van Rest) +<ul> +<li>10:00 Sergey Edunov (Facebook). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297731.pdf">Generating realistic trillion-edge graphs</a></li> +<li>10:30 George Fletcher (TU Eindhoven). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297733.pdf">An open source framework for schema-driven graph instance and graph query workload generation</a>.</li> +<li>11:00 Yinglong Xia (Huawei Research America): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297735.pdf">An Efficient Big Graph Analytics Platform</a>.</li> +<li>11:30 Zhe Wu (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297737.pdf">Bridging RDF Graph and Property Graph Data Models</a></li> +</ul> +</li> +<li>12:00 - 13:30 Lunch (provided)</li> +<li>13:30 - 15:30 Graph Technologies (chair Arnau Prat) +<ul> +<li>13:30 Tobias Lindaaker (Neo Technology). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297740.pdf">An open standard for graph queries: the Cypher contribution</a></li> +<li>14:00 Arash Termehchy (Oregon State University). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297742.pdf">Toward Representation Independent Graph Querying &amp; Analytics</a></li> +<li>14:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297745.pdf">In the service of the federation</a></li> +<li>15:00 Nandish Jayaram (Pivotal). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297747.pdf">Orion: Enabling Suggestions in a Visual Query Builder for Ultra-Heterogeneous Graphs</a>.</li> +</ul> +</li> +<li>15:30 - 16:00 Coffee break</li> +<li>16:00 - 17:15 Applications and use of Graph Technologies (chair Hassan Chafi) +<ul> +<li>16:00 Jans Aasman (Franz Inc.). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428806.pdf">Semantic Data Lake for Healthcare</a></li> +<li>16:15 Kevin Madden (Tom Sawyer Software). 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428812.pdf">Dismantling Criminal Networks with Graph and Spatial Visualization and Analysis</a></li> +<li>16:45 Juan Sequeda (Capsenta). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428810.pdf">Using graph representation and semantic technology to virtually integrate and search multiple diverse data sources</a></li> +<li>17:15 Kevin Wilkinson (Hewlett Packard Labs). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428808.pdf">LDBC SNB extensions</a></li> +</ul> +</li> +<li>17:45 - 18:15 Closing discussion</li> +</ul> +<h6 id="friday-24th-of-june-2016-room-105"><strong>Friday, 24th of June 2016 (Room 105)</strong></h6> +<p>At the same venue: the fourth international workshop on Graph Data Management, Experience and Systems (<strong>GRADES16</strong>).</p> +<p>18:30 social dinner for GRADES registrants (place to be announced)</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>22nd and 23rd June 2016</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a></p> +<p>The address is:</p> +<p><strong>Room 203 (Wed-Thu) &amp; Room 105 (Fri)</strong><br> +<strong>Oracle Conference Center</strong><br> +<strong>350 Oracle Parkway</strong><br> +<strong>Redwood City, CA 94065, USA</strong></p> +<p><strong>Maps and situation</strong></p> +<p><a href="https://www.google.com/maps/place/Oracle+Conference+Center/@37.5322827,-122.2667034,17z/data=!3m1!4b1!4m2!3m1!1s0x808f98b5450e8ca3:0xdc75e8b1c02bbb91">Google Maps link</a></p> +<p>Oracle Campus map:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/40927234.jpg" alt=""></p> +<h5 id="getting-there"><strong>Getting there</strong></h5> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<ul> +<li>[Southbound] <strong>-</strong> Take Highway 101 South (toward San Jose) to the Ralston Ave./Marine World Parkway exit. Take Marine World Parkway east which will loop you back over the freeway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +<li>[Northbound] <strong>-</strong> Take Highway 101 North (toward San Francisco) to the Ralston Ave./Marine World Parkway exit. Take the first exit ramp onto Marine World Parkway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +</ul> +<h5 id="parking"><strong>Parking</strong></h5> +<p>The Conference Center has a designated parking lot located directly across from the building. If the lot is filled there is also additional parking in any of the parking garages located near by. No parking permits are needed.</p> +<h5 id="public-transport"><strong>Public transport</strong></h5> +<p>Take the Caltrain to either San Carlos or Hillsdale and take the free Oracle shuttle from there. 
Get off the Oracle shuttle at 100 Oracle Parkway (second stop) and walk 5 minutes to get to the Conference Center.</p>
+<ul>
+<li>Caltrain timetables: <a href="http://www.caltrain.com/schedules/weekdaytimetable.html">http://www.caltrain.com/schedules/weekdaytimetable.html</a></li>
+<li>Oracle Shuttle timetables: <a href="http://www.caltrain.com/schedules/Shuttles/Oracle_Shuttle.html">http://www.caltrain.com/schedules/Shuttles/Oracle_Shuttle.html</a></li>
+</ul>
+<p>You can also take the Caltrain to Belmont and walk 23 minutes instead of taking the Oracle shuttle.</p>
+<p>Alternatively, SamTrans (San Mateo County&rsquo;s Transit Agency) provides public bus service between the Millbrae BART station and Palo Alto with three stops on Oracle Parkway - one of which is directly in front of the Oracle Conference Center.</p> + + + + + LDBC and Apache Flink + https://ldbcouncil.org/post/ldbc-and-apache-flink/ + Mon, 16 Nov 2015 14:47:00 +0000 + + https://ldbcouncil.org/post/ldbc-and-apache-flink/ + <p>Apache Flink <a href="#references">[1]</a> is an open source platform for distributed stream and batch data processing. Flink&rsquo;s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.</p>
+<p><img src="https://flink.apache.org/img/flink-stack-small.png" alt=""></p>
+<p>Flink offers multiple APIs to process data from various data sources (e.g. HDFS, HBase, Kafka and JDBC). The DataStream and DataSet APIs allow the user to apply general-purpose data operations, like map, reduce, groupBy and join, on streams and static data respectively. In addition, Flink provides libraries for machine learning (Flink ML), graph processing (Gelly) and SQL-like operations (Table). 
All APIs can be used together in a single Flink program, which enables the definition of powerful analytical workflows and the implementation of distributed algorithms.</p>
+<p>The following snippet shows how a wordcount program can be expressed in Flink using the DataSet API:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">&gt;</span> text <span style="color:#f92672">=</span> env<span style="color:#f92672">.</span><span style="color:#a6e22e">fromElements</span><span style="color:#f92672">(</span>
+</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the past controls the future.&#34;</span><span style="color:#f92672">,</span>
+</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the present controls the past.&#34;</span><span style="color:#f92672">);</span>
+</span></span><span style="display:flex;"><span>
+</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>Tuple2<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">,</span> Integer<span style="color:#f92672">&gt;&gt;</span> wordCounts <span style="color:#f92672">=</span> text
+</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">flatMap</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> LineSplitter<span style="color:#f92672">())</span> <span style="color:#75715e">// splits the line and outputs (word,1)
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">.</span><span style="color:#a6e22e">groupBy</span><span style="color:#f92672">(</span><span style="color:#ae81ff">0</span><span style="color:#f92672">)</span> <span style="color:#75715e">// group by word
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">.</span><span style="color:#a6e22e">sum</span><span style="color:#f92672">(</span><span style="color:#ae81ff">1</span><span style="color:#f92672">);</span> <span style="color:#75715e">// sum the 1&#39;s
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>
+</span></span><span style="display:flex;"><span>wordCounts<span style="color:#f92672">.</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span>
+</span></span></code></pre></div><p>At Leipzig University, we use Apache Flink as the execution layer for our graph analytics platform Gradoop <a href="#references">[2]</a>. The LDBC datagen helps us to evaluate the scalability of our algorithms and operators in a distributed execution environment. To use the generated graph data in Flink, we wrote a tool that transforms the LDBC output files into Flink data sets for further processing <a href="#references">[3]</a>. 
Using the class <code>LDBCToFlink</code>, LDBC output files can be read directly from HDFS or from the local file system:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;hdfs:///ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> <span style="color:#75715e">// or &#34;/path/to/social_network&#34; +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> vertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> edges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The tuple classes <code>LDBCVertex</code> and <code>LDBCEdge</code> hold the information generated by the LDBC datagen and are created directly from its output files. During the transformation process, globally unique vertex identifiers are created based on the LDBC identifier and the vertex class. When reading edge files, source and target vertex identifiers are computed in the same way to ensure consistent linking between vertices.</p> +<p>Each <code>LDBCVertex</code> instance contains:</p> +<ul> +<li>an identifier, which is unique among all vertices * a vertex label (e.g. <code>Person</code>, <code>Comment</code>) * a key-value map of properties including also multivalued properties<br> +(e.g. <code>Person.email</code>)</li> +</ul> +<p>Each <code>LDBCEdge</code> instance contains:</p> +<ul> +<li>an identifier, which is unique among all edges</li> +<li>an edge label (e.g. <code>knows</code>, <code>likes</code>)</li> +<li>a source vertex identifier</li> +<li>a target vertex identifier</li> +<li>a key-value map of properties</li> +</ul> +<p>The resulting datasets can be used by the DataSet API and all libraries that are built on top of it (i.e. Flink ML, Gelly and Table). In the following example, we load the LDBC graph from HDFS, filter vertices with the label <code>Person</code> and edges with the label <code>knows</code> and use Gelly to compute the connected components of that subgraph. 
The full source code is available on GitHub <a href="#references">[4]</a>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;/home/s1ck/Devel/Java/ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter vertices with label “Person” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> ldbcVertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">VERTEX_CLASS_PERSON</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter edges with label “knows” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> ldbcEdges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">EDGE_CLASS_KNOWS</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly vertices suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> vertices <span style="color:#f92672">=</span> ldbcVertices<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span 
style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly edges suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Edge<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;&gt;</span> edges <span style="color:#f92672">=</span> ldbcEdges<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>Graph<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;</span> g <span style="color:#f92672">=</span> Graph<span style="color:#f92672">.</span><span style="color:#a6e22e">fromDataSet</span><span style="color:#f92672">(</span>vertices<span style="color:#f92672">,</span> edges<span style="color:#f92672">,</span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// run connected components on the subgraph for 10 iterations +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> components <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> g<span style="color:#f92672">.</span><span style="color:#a6e22e">run</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> ConnectedComponents<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// print the component id of the first 10 vertices +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>components<span style="color:#f92672">.</span><span style="color:#a6e22e">first</span><span style="color:#f92672">(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">).</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The ldbc-flink-import tool is available on Github <a href="#references">[3]</a> and licensed under the GNU GPLv3. If you have any questions regarding the tool please feel free to contact me on GitHub. 
If you find bugs or have any ideas for improvements, please create an issue or a pull request.</p> +<p>If you want to learn more about Apache Flink, a good starting point is the main documentation <a href="#references">[5]</a> and if you have any question feel free to ask the official mailing lists.<br> +There is also a nice set of videos <a href="#references">[6]</a> available from the latest Flink Forward conference.</p> +<h4 id="references">References</h4> +<p>[1] <a href="http://flink.apache.org/">http://flink.apache.org/</a></p> +<p>[2] <a href="https://github.com/dbs-leipzig/gradoop">https://github.com/dbs-leipzig/gradoop</a></p> +<p>[3] <a href="https://github.com/s1ck/ldbc-flink-import">https://github.com/s1ck/ldbc-flink-import</a></p> +<p>[4] <a href="https://gist.github.com/s1ck/b33e6a4874c15c35cd16">https://gist.github.com/s1ck/b33e6a4874c15c35cd16</a></p> +<p>[5] <a href="https://ci.apache.org/projects/flink/flink-docs-release-0.10/">https://ci.apache.org/projects/flink/flink-docs-release-0.10/</a></p> +<p>[6] <a href="https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA">https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA</a></p> + + + + + Seventh TUC Meeting + https://ldbcouncil.org/event/seventh-tuc-meeting/ + Mon, 09 Nov 2015 14:17:30 -0400 + + https://ldbcouncil.org/event/seventh-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Seventh Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="http://www.research.ibm.com/labs/watson">IBM&rsquo;s TJ Watson</a> facility on <strong>Monday and Tuesday November 9/10, 2015.</strong></p> +<p>This will be the first TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify IBM security in advance, registration requests need to be in by Nov 1.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<p>In this page, you&rsquo;ll find information about the following items:</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a><br> +- <a href="#date"><strong>Date</strong></a><br> +- <a href="#venue"><strong>Venue</strong></a><br> +- <a href="#maps-and-situation"><strong>Maps and situation</strong></a><br> +- <a href="#getting-there"><strong>Getting there</strong></a></li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>Monday, 9th of November 2015</strong></p> +<p>8:45 - 9:15 Registration and welcome (Yinglong Xia and Josep L. Larriba Pey)</p> +<p>9:15 - 9:30 LDBC introduction and status update (Josep L. Larriba-Pey)</p> +<p>9:30 - 10:30 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</p> +<p>9:30 Arnau Prat (DAMA-UPC). Social Network Benchmark, Interactive workload</p> +<p>10:00 Orri Erling (OpenLink Software). Social Network Benchmark, Business Intelligence workload</p> +<p>10:30-11:00 Coffee break</p> +<p>11:00 - 12:30 Details on the progress of LDBC Task Forces 2 (chair Yinglong Xia)</p> +<p>11:00 Alexandru Iosup (TU Delft). Social Network Benchmark, Analytics workload.</p> +<p>11:30 Claudio Gutierrez (U Chile). Query Language Task Force status.</p> +<p>12:00 Atanas Kiryakov (Ontotext). Semantic Publishing Benchmark status</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 - 16:00 Technologies and benchmarking (chair Hassan Chafi)</p> +<p>14:00 Molham Aref (LogicBlox). Graph Data Management with LogicBlox</p> +<p>14:30 Peter Kogge (Notre Dame). BFS as in Graph500 on today&rsquo;s architectures</p> +<p>15:00 Ching-Yung Lin (IBM). Status and Demo of IBM System G</p> +<p>15:30-16:00 Coffee break</p> +<p>16:00 - 17:00 Technologies (chair Irini Fundulaki)</p> +<p>16:00 Kavitha Srinivas (IBM). SQLGraph: An efficient relational based property graph store</p> +<p>16:30 David Ediger (GeorgiaTech). STINGER</p> +<p>17:00 Gary King (Franz Inc.). AllegroGraph&rsquo;s SPARQL implementation with Social Network Analytics abilities using Magic Properties</p> +<p>17:30 Manoj Kumar (IBM). Linear Algebra Formulation for Large Graph Analytics</p> +<p>18:00 Reihaneh Amini (Wright State University) Linked Data in the GeoLink Usecase</p> +<p>19:00 Social dinner</p> +<p><strong>Tuesday 10th November 2015</strong></p> +<p>9:00 - 10:30 Technology, Applications and Benchmarking (chair Alexandru Iosup)</p> +<p>9:00 Philip Rathle (Neo). On openCypher</p> +<p>9:20 Morteza Shahriari (University of Florida). Multi-modal Probabilistic Knowledge Base for Remote Sensing Species Identification</p> +<p>9:50 Peter Kogge (Notre Dame). Challenging problems with Lexis Nexis Risk Solutions</p> +<p>10:10 Arnau Prat (DAMA-UPC). DATAGEN, status and perspectives for synthetic data generation</p> +<p>10:30 - 11:00 Coffee break</p> +<p>11:00 - 12:45 Applications and use of Graph Technologies (chair Atanas Kiryakov)</p> +<p>11:00 Hassan Chafi (Oracle). Status and characteristics of PGQL</p> +<p>11:20 David Guedalia (TAGIIO). Multi-tier distributed mobile applications and how they split their workload,</p> +<p>11:40 Guojing Cong (IBM). Algorithmic technique and architectural support for fast graph analysis</p> +<p>12:00 Josep Lluis Larriba-Pey. 
Conclusions for the TUC meeting and future perspectives</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>9th and 10th November 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the IBM Thomas J Watson Research Center.<br> +The address is:</p> +<p><strong>IBM Thomas J Watson Research Center</strong><br> +<strong>1101 Kitchawan Rd,</strong><br> +<strong>Yorktown Heights, NY 10598, USA</strong></p> +<p>If you are using a <em>GPS system</em>, please enter <strong>&ldquo;200 Aqueduct Road, Ossining NY, 10562&rdquo;</strong> for accurate directions to the lab entrance. You may also want to check the routing online.</p> +<p>The meeting will take place in the <em>Auditorium</em> on November 9th, and in Meeting Room <em>20-043</em> on November 10th.</p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p>You are highly suggested to <strong>rent a car</strong> for your convenience, since the public transportation system does not cover this area very well. Besides, there is no hotel within walkable distance to the IBM T.J. Watson Research Center. Feel free to find carpool with other attendees. You may find car rental and hotels through <a href="http://www.orbitz.com">www.orbitz.com</a>, or <a href="http://www.expedia.com">www.expedia.com</a> Feel free to email <a href="mailto:yxia@us.ibm.com">yxia@us.ibm.com</a> for any questions.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/seventh-tuc-meeting/attachments/6882333/15926330.png" alt=""></p> +<h6 id="getting-there"><strong>Getting there</strong></h6> +<p><strong>Upper and Eastern New England</strong></p> +<p>Route I-84 west to Route I-684, south to Exit 6, west on Route 35 to Route 100, south to Route 134, west 2.5 miles. IBM is on the left.</p> +<p><strong>New Haven and Connecticut Shores</strong></p> +<p>Merritt Parkway or New England Thruway (Route I-95) west to Route I-287, west to Exit 3, north on Sprain Brook Parkway, which merges into Taconic State Parkway, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New Jersey</strong></p> +<p>Take New York State Thruway (Route I-87) east across the Tappan Zee Bridge and follow signs to the Saw Mill Parkway north. Proceed north on Saw Mill River Parkway to Taconic State Parkway exit, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>Upstate New York</strong></p> +<p>Route I-84 east across Newburgh-Beacon Bridge to Exit 16-S. Taconic State Parkway south to Route 134 East exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New York City (Manhattan)</strong></p> +<p>Henry Hudson Parkway north, which becomes Saw Mill River Parkway, north to Taconic State Parkway exit. North on Taconic State Parkway to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>John F. Kennedy International Airport</strong></p> +<p>North on Van Wyck Expressway to the Whitestone Expressway and continue north across the Bronx-Whitestone Bridge to the Hutchinson River Parkway north to the Cross County Parkway exit and proceed west to the Bronx River Parkway. 
North on the Bronx River Parkway to the Sprain Brook Parkway, which merges into the Taconic State Parkway. Continue north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>LaGuardia Airport</strong></p> +<p>East on the Grand Central Parkway, north on the Whitestone Expressway, and continue north across the Bronx-Whitestone Bridge. Continue with instructions from John F. Kennedy International Airport, above.</p> +<p><strong>Newark International Airport</strong></p> +<p>North on the New Jersey Turnpike (Route I-95). Stay in local lanes and take Exit 72 for Palisades Interstate Parkway. North on the Palisades Interstate Parkway to the New York State Thruway, Route I-87, and east across the Tappan Zee Bridge. Continue with instructions from New Jersey, above.</p> +<p><strong>Stewart International Airport</strong></p> +<p>Route 207 east to Route I-84, east across Newburgh-Beacon Bridge to Taconic State Parkway, south. Continue with instructions from Upstate New York, above.</p> +<p><strong>Westchester County Airport</strong></p> +<p>Right on Route 120, north. Turn left where Route 120 merges with Route 133. Continue on Route 120. Cross Route 100 and continue straight on Shingle House Road to Pines Bridge Road. Turn right and proceed several hundred yards. IBM is on the left.</p> +<p><strong>Public Transportation</strong></p> +<p>Metropolitan Transportation Authority (MTA) train stations nearest to the Yorktown Heights location are the Croton-Harmon and White Plains stations. Taxi service is available at both locations.</p> + + + + + Elements of Instance Matching Benchmarks: a Short Overview + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + Tue, 16 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + <p>The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not explicitly stated but is discovered using <strong>instance matching</strong> techniques and tools. Instance matching is also known as <strong>record linkage</strong> <a href="#references">[1]</a>, <strong>duplicate detection</strong> <a href="#references">[2]</a>, <strong>entity resolution</strong> <a href="#references">[3]</a> and <strong>object identification</strong> <a href="#references">[4]</a>.</p> +<p>For instance, a search in Geonames (<a href="http://www.geonames.org/">http://www.geonames.org/</a>) for &ldquo;Athens&rdquo; would return a resource (i.e., URI) accompanied with a map of the area and information about the place; additional information for the city of Athens can be found in other datasets such as for instance DBpedia (<a href="http://dbpedia.org/">http://dbpedia.org/</a>) or Open Government Datasets (<a href="http://data.gov.gr/">http://data.gov.gr/</a>). 
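</p>
+<p>As a toy illustration of what such a discovered link looks like (this is not how real instance matching tools work; the URIs and the similarity threshold below are purely illustrative), a naive matcher might compare the labels of the two resources and, when they are similar enough, emit an <code>owl:sameAs</code> statement in N-Triples syntax:</p>
+<pre><code class="language-java">import java.util.Arrays;
+import java.util.HashSet;
+import java.util.Set;
+
+// Toy sketch only: decide whether two resource descriptions refer to the same
+// real-world object and, if so, print the corresponding owl:sameAs link.
+public class NaiveInstanceMatcher {
+
+    // Jaccard similarity over the lower-cased tokens of two labels.
+    static double labelSimilarity(String a, String b) {
+        Set&lt;String&gt; ta = new HashSet&lt;&gt;(Arrays.asList(a.toLowerCase().split("\\s+")));
+        Set&lt;String&gt; tb = new HashSet&lt;&gt;(Arrays.asList(b.toLowerCase().split("\\s+")));
+        Set&lt;String&gt; union = new HashSet&lt;&gt;(ta);
+        union.addAll(tb);
+        ta.retainAll(tb);                        // ta now holds the intersection
+        return union.isEmpty() ? 0.0 : (double) ta.size() / union.size();
+    }
+
+    public static void main(String[] args) {
+        String geonamesUri   = "http://sws.geonames.org/264371/";    // illustrative URI
+        String dbpediaUri    = "http://dbpedia.org/resource/Athens";
+        String geonamesLabel = "Athens";
+        String dbpediaLabel  = "Athens Greece";
+
+        if (labelSimilarity(geonamesLabel, dbpediaLabel) &gt;= 0.5) {   // illustrative threshold
+            System.out.printf("&lt;%s&gt; &lt;http://www.w3.org/2002/07/owl#sameAs&gt; &lt;%s&gt; .%n",
+                    geonamesUri, dbpediaUri);
+        }
+    }
+}
+</code></pre>
+<p>Real systems of course rely on far more sophisticated similarity measures and on the structure of the data, which is exactly the kind of capability the benchmarks discussed below aim to evaluate.</p>
+<p>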
To obtain all necessary information about the city of Athens we need to establish that the retrieved resources refer to the same real world object.</p>
+<p>Web resources are published by &ldquo;autonomous agents&rdquo; who choose their preferred information representation or the one that best fits the application of interest. Furthermore, different representations of the same real world entity are due to data acquisition errors or different acquisition techniques used to process scientific data. Moreover, real world entities evolve and change over time, and sources need to keep track of these developments, a task that is very hard and often not possible. Finally, when integrating data from multiple sources, the process itself may add new erroneous data. Clearly, these problems are not limited to the era of Web Data; it is thus not surprising that instance matching systems have been around for several years <a href="#references">[2]</a><a href="#references">[5]</a>.</p>
+<p>It is therefore essential to develop, along with instance and entity matching systems, <em>instance matching benchmarks to determine the weak and strong points of those systems, as well as their overall quality in order to support users in deciding the system to use for their needs</em>. Hence, well-defined, good-quality benchmarks are important for comparing the performance of the available or under-development instance matching systems. Benchmarks are used not only to inform users of the strengths and weaknesses of systems, but also to motivate developers, researchers and technology vendors to deal with the weak points of their systems and to ameliorate their performance and functionality. They are also useful for identifying the settings in which each of the systems has optimal performance. Benchmarking aims at providing an objective basis for such assessments.</p>
+<p>An instance matching benchmark for Linked Data consists of a <em>source</em> and <em>target dataset</em> implementing a set of <em>test-cases</em>, where each test case addresses a different kind of requirement regarding instance matching, a <em>ground truth</em> or <em>gold standard</em> and finally the <em>evaluation metrics</em> used to <em>assess the benchmark</em>.</p>
+<p>Datasets are the raw material of a benchmark. A benchmark comprises a <em>source</em> and a <em>target</em> dataset, and the objective of an instance matching system is to discover the matches between the two. Datasets are characterized by (a) their <em>nature</em> (<em>real</em> or <em>synthetic</em>), (b) the <em>schemas/ontologies</em> they use, (c) their <em>domains</em>, (d) the <em>languages</em> they are written in, and (e) the <em>variations/heterogeneities</em> of the datasets. Real datasets are widely used in benchmarks since they offer realistic conditions for heterogeneity problems and they have realistic distributions. <em>Synthetic datasets</em> are generated using automated data generators and are useful because they offer fully controlled test conditions, have accurate gold standards and allow setting the focus on specific types of heterogeneity problems in a systematic manner.</p>
+<p>Datasets (and benchmarks) may contain different <em>kinds of variations</em> that correspond to <em>different test cases</em>. According to Ferrara et al. 
<a href="#references">[6]</a><a href="#references">[7]</a>, three kinds of variations exist for Linked Data, namely <em>data variations</em>, <em>structural variations</em> and <em>logical variations</em>. The first refers mainly to differences due to typographical errors, differences in the employed data formats, language etc. The second refers to the differences in the structure of the employed Linked Data schemas. Finally, the third type derives from the use of semantically rich RDF and OWL constructs that enable one to define hierarchies and equivalence of classes and properties, (in)equality of instances, complex class definitions through union and intersection among others.</p> +<p>The common case in real benchmarks is that the datasets to be matched contain different kinds (combinations) of variations. On the other hand, synthetic datasets may be purposefully designed to contain specific types (or combinations) of variations (e.g., only structural), or may be more general in an effort to illustrate all the common cases of discrepancies that appear in reality between individual descriptions.</p> +<p>The <em>gold standard</em> is considered as the “correct answer sheet” of the benchmark, and is used to judge the completeness and soundness of the result sets of the benchmarked systems. For instance matching benchmarks employing synthetic datasets, the gold standard is always automatically generated, as the errors (variations) that are added into the datasets are known and systematically created. When it comes to real datasets, the gold standard can be either manually curated or (semi-) automatically generated. In the first case, domain experts manually mark the matches between the datasets, whereas in the second, supervised and crowdsourcing techniques aid the process of finding the matches, a process that is often time consuming and error prone.</p> +<p>Last, an instance matching benchmark uses <em>evaluation metrics</em> to determine and assess the systems’ output quality and performance. For instance matching tools, performance is not a critical aspect. On the other hand, an instance matching tool should return all and only the correct answers. So, what matters most is returning the relevant matches, rather than returning them quickly. For this reason, the evaluation metrics that are dominantly employed for instance matching benchmarks are the standard <em>precision</em>, <em>recall</em> and <em>f-measure</em> metrics.</p> +<h4 id="references">References</h4> +<p>[1] Li, C., Jin, L., and Mehrotra, S. (2006) Supporting efficient record linkage for large data sets using mapping techniques. WWW 2006.</p> +<p>[2] Dragisic, Z., Eckert, K., Euzenat, J., Faria, D., Ferrara, A., Granada, R., Ivanova, V., Jimenez-Ruiz, E., Oskar Kempf, A., Lambrix, P., Montanelli, S., Paulheim, H., Ritze, D., Shvaiko, P., Solimando, A., Trojahn, C., Zamaza, O., and Cuenca Grau, B. (2014) Results of the Ontology Alignment Evaluation Initiative 2014. Proc. 9th ISWC workshop on ontology matching (OM 2014).</p> +<p>[3] Bhattacharya, I. and Getoor, L. (2006) Entity resolution in graphs. Mining Graph Data. Wiley and Sons 2006.</p> +<p>[4] Noessner, J., Niepert, M., Meilicke, C., and Stuckenschmidt, H. (2010) Leveraging Terminological Structure for Object Reconciliation. In ESWC 2010.</p> +<p>[5] Flouris, G., Manakanatas, D., Kondylakis, H., Plexousakis, D., Antoniou, G. 
Ontology Change: Classification and Survey (2008) Knowledge Engineering Review (KER 2008), pages 117-152.</p> +<p>[6] Ferrara, A., Lorusso, D., Montanelli, S., and Varese, G. (2008) Towards a Benchmark for Instance Matching. Proc. 3th ISWC workshop on ontology matching (OM 2008).</p> +<p>[7] Ferrara, A., Montanelli, S., Noessner, J., and Stuckenschmidt, H. (2011) Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p> + + + + + SNB Interactive Part 3: Choke Points and Initial Run on Virtuoso + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + Wed, 10 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + <p>In this post we will look at running the <a href="https://ldbcouncil.org/developer/snb">LDBC SNB</a> on <a href="https://virtuoso.openlinksw.com/">Virtuoso</a>.</p> +<p>First, let&rsquo;s recap what the benchmark is about:</p> +<ol> +<li> +<p>fairly frequent short updates, with no update contention worth mentioning</p> +</li> +<li> +<p>short random lookups</p> +</li> +<li> +<p>medium complex queries centered around a person&rsquo;s social environment</p> +</li> +</ol> +<p>The updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an online social application does lookups for the most part. The medium complex queries are to challenge the DBMS.</p> +<p>The DBMS challenges have to do firstly with query optimization, and secondly with execution with a lot of non-local random access patterns. Query optimization is not a requirement, <em>per se,</em> since imperative implementations are allowed, but we will see that these are no more free of the laws of nature than the declarative ones.</p> +<p>The workload is arbitrarily parallel, so intra-query parallelization is not particularly useful, if also not harmful. There are latency constraints on operations which strongly encourage implementations to stay within a predictable time envelope regardless of specific query parameters. The parameters are a combination of person and date range, and sometimes tags or countries. The hardest queries have the potential to access all content created by people within 2 steps of a central person, so possibly thousands of people, times 2000 posts per person, times up to 4 tags per post. We are talking in the millions of key lookups, aiming for sub-second single-threaded execution.</p> +<p>The test system is the same as used in the <a href="http://www.openlinksw.com/weblog/oerling/?id=1739">TPC-H series</a>: dual Xeon E5-2630, 2x6 cores x 2 threads, 2.3GHz, 192 GB RAM. The software is the <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics branch</a> of <a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack, available from www.github.com</a>.</p> +<p>The dataset is the SNB 300G set, with:</p> +<table> +<thead> +<tr> +<th>1,136,127</th> +<th>persons</th> +</tr> +</thead> +<tbody> +<tr> +<td>125,249,604</td> +<td>knows edges</td> +</tr> +<tr> +<td>847,886,644</td> +<td>posts, including replies</td> +</tr> +<tr> +<td>1,145,893,841</td> +<td>tags of posts or replies</td> +</tr> +<tr> +<td>1,140,226,235</td> +<td>likes of posts or replies</td> +</tr> +</tbody> +</table> +<p>As an initial step, we run the benchmark as fast as it will go. 
We use 32 threads on the driver side for 24 hardware threads.</p> +<p>Below are the numerical quantities for a 400K operation run after 150K operations worth of warmup.</p> +<p><strong>Duration:</strong> 10:41.251<br> +<strong>Throughput:</strong> 623.71 (op/s)</p> +<p>The statistics that matter are detailed below, with operations ranked in order of descending client-side wait-time. All times are in milliseconds.</p> +<table> +<thead> +<tr> +<th>% of total</th> +<th>total_wait</th> +<th>name</th> +<th>count</th> +<th>mean</th> +<th>min</th> +<th>max</th> +</tr> +</thead> +<tbody> +<tr> +<td>20%</td> +<td>4,231,130</td> +<td>LdbcQuery5</td> +<td>656</td> +<td>6,449.89</td> +<td>245</td> +<td>10,311</td> +</tr> +<tr> +<td>11%</td> +<td>2,272,954</td> +<td>LdbcQuery8</td> +<td>18,354</td> +<td>123.84</td> +<td>14</td> +<td>2,240</td> +</tr> +<tr> +<td>10%</td> +<td>2,200,718</td> +<td>LdbcQuery3</td> +<td>388</td> +<td>5,671.95</td> +<td>468</td> +<td>17,368</td> +</tr> +<tr> +<td>7.3%</td> +<td>1,561,382</td> +<td>LdbcQuery14</td> +<td>1,124</td> +<td>1,389.13</td> +<td>4</td> +<td>5,724</td> +</tr> +<tr> +<td>6.7%</td> +<td>1,441,575</td> +<td>LdbcQuery12</td> +<td>1,252</td> +<td>1,151.42</td> +<td>15</td> +<td>3,273</td> +</tr> +<tr> +<td>6.5%</td> +<td>1,396,932</td> +<td>LdbcQuery10</td> +<td>1,252</td> +<td>1,115.76</td> +<td>13</td> +<td>4,743</td> +</tr> +<tr> +<td>5%</td> +<td>1,064,457</td> +<td>LdbcShortQuery3PersonFriends</td> +<td>46,285</td> +<td>22.9979</td> +<td>0</td> +<td>2,287</td> +</tr> +<tr> +<td>4.9%</td> +<td>1,047,536</td> +<td>LdbcShortQuery2PersonPosts</td> +<td>46,285</td> +<td>22.6323</td> +<td>0</td> +<td>2,156</td> +</tr> +<tr> +<td>4.1%</td> +<td>885,102</td> +<td>LdbcQuery6</td> +<td>1,721</td> +<td>514.295</td> +<td>8</td> +<td>5,227</td> +</tr> +<tr> +<td>3.3%</td> +<td>707,901</td> +<td>LdbcQuery1</td> +<td>2,117</td> +<td>334.389</td> +<td>28</td> +<td>3,467</td> +</tr> +<tr> +<td>2.4%</td> +<td>521,738</td> +<td>LdbcQuery4</td> +<td>1,530</td> +<td>341.005</td> +<td>49</td> +<td>2,774</td> +</tr> +<tr> +<td>2.1%</td> +<td>440,197</td> +<td>LdbcShortQuery4MessageContent</td> +<td>46,302</td> +<td>9.50708</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.9%</td> +<td>407,450</td> +<td>LdbcUpdate5AddForumMembership</td> +<td>14,338</td> +<td>28.4175</td> +<td>0</td> +<td>2,008</td> +</tr> +<tr> +<td>1.9%</td> +<td>405,243</td> +<td>LdbcShortQuery7MessageReplies</td> +<td>46,302</td> +<td>8.75217</td> +<td>0</td> +<td>2,112</td> +</tr> +<tr> +<td>1.9%</td> +<td>404,002</td> +<td>LdbcShortQuery6MessageForum</td> +<td>46,302</td> +<td>8.72537</td> +<td>0</td> +<td>1,968</td> +</tr> +<tr> +<td>1.8%</td> +<td>387,044</td> +<td>LdbcUpdate3AddCommentLike</td> +<td>12,659</td> +<td>30.5746</td> +<td>0</td> +<td>2,060</td> +</tr> +<tr> +<td>1.7%</td> +<td>361,290</td> +<td>LdbcShortQuery1PersonProfile</td> +<td>46,285</td> +<td>7.80577</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.6%</td> +<td>334,409</td> +<td>LdbcShortQuery5MessageCreator</td> +<td>46,302</td> +<td>7.22234</td> +<td>0</td> +<td>2,055</td> +</tr> +<tr> +<td>1%</td> +<td>220,740</td> +<td>LdbcQuery2</td> +<td>1,488</td> +<td>148.347</td> +<td>2</td> +<td>2,504</td> +</tr> +<tr> +<td>0.96%</td> +<td>205,910</td> +<td>LdbcQuery7</td> +<td>1,721</td> +<td>119.646</td> +<td>11</td> +<td>2,295</td> +</tr> +<tr> +<td>0.93%</td> +<td>198,971</td> +<td>LdbcUpdate2AddPostLike</td> +<td>5,974</td> +<td>33.3062</td> +<td>0</td> +<td>1,987</td> +</tr> +<tr> +<td>0.88%</td> +<td>189,871</td> 
+<td>LdbcQuery11</td>
+<td>2,294</td>
+<td>82.7685</td>
+<td>4</td>
+<td>2,219</td>
+</tr>
+<tr>
+<td>0.85%</td>
+<td>182,964</td>
+<td>LdbcQuery13</td>
+<td>2,898</td>
+<td>63.1346</td>
+<td>1</td>
+<td>2,201</td>
+</tr>
+<tr>
+<td>0.74%</td>
+<td>158,188</td>
+<td>LdbcQuery9</td>
+<td>78</td>
+<td>2,028.05</td>
+<td>1,108</td>
+<td>4,183</td>
+</tr>
+<tr>
+<td>0.67%</td>
+<td>143,457</td>
+<td>LdbcUpdate7AddComment</td>
+<td>3,986</td>
+<td>35.9902</td>
+<td>1</td>
+<td>1,912</td>
+</tr>
+<tr>
+<td>0.26%</td>
+<td>54,947</td>
+<td>LdbcUpdate8AddFriendship</td>
+<td>571</td>
+<td>96.2294</td>
+<td>1</td>
+<td>988</td>
+</tr>
+<tr>
+<td>0.2%</td>
+<td>43,451</td>
+<td>LdbcUpdate6AddPost</td>
+<td>1,386</td>
+<td>31.3499</td>
+<td>1</td>
+<td>2,060</td>
+</tr>
+<tr>
+<td>0.01%</td>
+<td>1,848</td>
+<td>LdbcUpdate4AddForum</td>
+<td>103</td>
+<td>17.9417</td>
+<td>1</td>
+<td>65</td>
+</tr>
+<tr>
+<td>0.00%</td>
+<td>44</td>
+<td>LdbcUpdate1AddPerson</td>
+<td>2</td>
+<td>22</td>
+<td>10</td>
+<td>34</td>
+</tr>
+</tbody>
+</table>
+<p>At this point we have in-depth knowledge of the choke points the benchmark stresses, and we can give a first assessment of whether the design meets its objectives for setting an agenda for the coming years of graph database development.</p>
+<p>The implementation is well optimized in general but still has maybe 30% room for improvement. We note that this is based on a compressed column store. One could think that alternative data representations, like in-memory graphs of structs and pointers between them, are better for the task. This is not necessarily so; at the least, a compressed column store is much more space efficient. Space efficiency is the root of cost efficiency, since as soon as the working set is not in memory, a random access workload is badly hit.</p>
+<p>The set of choke points (technical challenges) actually revealed by the benchmark so far is as follows:</p>
+<ul>
+<li>
+<p><em>Cardinality estimation under heavy data skew —</em> Many queries take a tag or a country as a parameter. The cardinalities associated with tags vary from 29M posts for the most common to 1 for the least common. Q6 has a common tag (in top few hundred) half the time and a random, most often very infrequent, one the rest of the time. A declarative implementation must recognize the cardinality implications from the literal and plan accordingly. An imperative one would have to count. Missing this makes Q6 take about 40% of the time instead of 4.1% when adapting.</p>
+</li>
+<li>
+<p><em>Covering indices —</em> Being able to make multi-column indices that duplicate some columns from the table often saves an entire table lookup. For example, an index on post by author can also contain the post&rsquo;s creation date.</p>
+</li>
+<li>
+<p><em>Multi-hop graph traversal —</em> Most queries access a two-hop environment starting at a person. Two queries look for shortest paths of unbounded length. For the two-hop case, it makes almost no difference whether this is done as a union or a special graph traversal operator. For shortest paths, this simply must be built into the engine; doing this client-side incurs prohibitive overheads. A bidirectional shortest path operation is a requirement for the benchmark.</p>
+</li>
+<li>
+<p><em>Top <em>K</em> —</em> Most queries returning posts order results by descending date. Once there are at least <em>k</em> results, anything older than the <em>k</em>th can be dropped, adding a date selection as early as possible in the query.
This interacts with vectored execution, so that starting with a short vector size more rapidly produces an initial top <em>k</em>.</p> +</li> +<li> +<p><em>Late projection —</em> Many queries access several columns and touch millions of rows but only return a few. The columns that are not used in sorting or selection can be retrieved only for the rows that are actually returned. This is especially useful with a column store, as this removes many large columns (e.g., text of a post) from the working set.</p> +</li> +<li> +<p><em>Materialization —</em> Q14 accesses an expensive-to-compute edge weight, the number of post-reply pairs between two people. Keeping this precomputed drops Q14 from the top place. Other materialization would be possible, for example Q2 (top 20 posts by friends), but since Q2 is just 1% of the load, there is no need. One could of course argue that this should be 20x more frequent, in which case there could be a point to this.</p> +</li> +<li> +<p><em>Concurrency control —</em> Read-write contention is rare, as updates are randomly spread over the database. However, some pages get read very frequently, e.g., some middle level index pages in the post table. Keeping a count of reading threads requires a mutex, and there is significant contention on this. Since the hot set can be one page, adding more mutexes does not always help. However, hash partitioning the index into many independent trees (as in the case of a cluster) helps for this. There is also contention on a mutex for assigning threads to client requests, as there are large numbers of short operations.</p> +</li> +</ul> +<p>In subsequent posts, we will look at specific queries, what they in fact do, and what their theoretical performance limits would be. In this way we will have a precise understanding of which way SNB can steer the graph DB community.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + SNB and Graphs Related Presentations at GRADES '15 + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + Fri, 29 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + <p>Next 31st of May the GRADES workshop will take place in Melbourne within the ACM/SIGMOD presentation. GRADES started as an initiative of the Linked Data Benchmark Council in the SIGMOD/PODS 2013 held in New York.</p> +<p>Among the papers published in this edition we have &ldquo;Graphalytics: A Big Data Benchmark for Graph-Processing Platforms&rdquo;, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can be found in <a href="https://github.com/ldbc">https://github.com/ldbc</a>) as the base to execute the algorithms used for the benchmark, among which we have BFS, community detection and connected components. We also have &ldquo;Microblogging Queries on Graph Databases: an Introspection&rdquo; which benchmarks two of the most significant Graph Databases in the market, i.e. 
Neo4j and Sparksee using microblogging queries on top of Twitter data. We can finally mention &ldquo;Frappé: Querying the Linux Kernel Dependency Graph&rdquo; which presents a framework for querying and visualising the dependencies of large C/C++ software systems.</p>
+<p><a href="http://event.cwi.nl/grades2015/program.shtml">Check the complete agenda.</a></p>
+<p>Meet you in Melbourne!</p>
+
+
+
+
+ SNB Interactive Part 2: Modeling Choices
+ https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/
+ Tue, 26 May 2015 00:00:00 +0000
+
+ https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/
+ <p><a href="https://ldbcouncil.org/benchmarks/snb">SNB Interactive</a> is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.</p>
+<p>In the case of <a href="http://dbpedia.org/resource/Virtuoso_Universal_Server">Virtuoso</a>, we have played with <a href="http://dbpedia.org/resource/SQL">SQL</a> and <a href="http://dbpedia.org/resource/SPARQL">SPARQL</a> implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that SQL allows materializing multi-part indices and data orderings that make sense for the application. In other words, there is transparency into physical design. An RDF application may also have physical design by means of structure-aware storage, but this is more complex, and here we are just concerned with speed and having things work precisely as we intend.</p>
+<h3 id="schema-design">Schema Design</h3>
+<p>SNB has a regular schema described by a <a href="https://en.wikipedia.org/wiki/Unified_Modeling_Language">UML</a> diagram. This has a number of relationships of which some have attributes. There are no heterogeneous sets, e.g. no need for run-time typed attributes or graph edges with the same label but heterogeneous end points. Translation into SQL or RDF is straightforward. Edges with attributes, e.g. the knows relation between people, would end up represented as a subject with the end points and the date since as properties. The relational implementation has a two-part primary key and the date since as a dependent column. A native property graph database would use an edge with an extra property for this, as such are typically supported.</p>
+<p>The only table-level choice has to do with whether <code>posts</code> and <code>comments</code> are kept in the same or different data structures. The Virtuoso schema has a single table for both, with nullable columns for the properties that occur only in one. This makes the queries more concise. There are cases where only non-reply posts of a given author are accessed. This is supported by having two author foreign key columns each with its own index. There is a single nullable foreign key from the reply to the post/comment being replied to.</p>
+<p>The workload has some frequent access paths that need to be supported by index. Some queries reward placing extra columns in indices. For example, a common pattern is accessing the most recent posts of an author or group of authors.
There, having a composite key of <code>ps_creatorid</code>, <code>ps_creationdate</code>, <code>ps_postid</code> pays off since the top-k on <code>creationdate</code> can be pushed down into the index without needing a reference to the table.</p>
+<p>The implementation is free to choose data types for attributes, specifically datetimes. The Virtuoso implementation adopts the practice of the <a href="http://dbpedia.org/resource/DEX_(Graph_database)">Sparksee</a> and <a href="http://dbpedia.org/resource/Neo4j">Neo4J</a> implementations and represents these as a count of milliseconds since epoch. This is less confusing, faster to compare and more compact than a native datetime datatype that may or may not have timezones etc. Using a built-in datetime seems to be nearly always a bad idea. A dimension table or a number for a time dimension avoids the ambiguities of a calendar or at least makes these explicit.</p>
+<p>The benchmark allows procedurally maintaining materializations of intermediate results for use by queries as long as these are maintained transaction by transaction. For example, each person could have the 20 newest posts by immediate contacts precomputed. This would reduce Q2 &ldquo;top of the wall&rdquo; to a single lookup. This does not, however, appear to be worthwhile. The Virtuoso implementation does do one such materialization for Q14: A connection weight is calculated for every pair of persons that know each other. This is related to the count of replies by one or the other to content generated by the other. If there does not exist a single reply in either direction, the weight is taken to be 0. This weight is precomputed after bulk load and subsequently maintained each time a reply is added. The table for this is the only row-wise structure in the schema and represents a half matrix of connected people, i.e. <code>person1</code>, <code>person2</code> -&gt; <code>weight</code>. <code>Person1</code> is by convention the one with the smaller <code>p_personid</code>. Note that comparing ids in this way is useful but not normally supported by RDF systems. RDF would end up comparing strings of URIs with disastrous performance implications unless an implementation specific trick were used.</p>
+<p>In the next installment we will analyze an actual run.</p>
+<h3 id="snb-interactive-series">SNB Interactive Series</h3>
+<ul>
+<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li>
+<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li>
+<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li>
+</ul>
+
+
+
+
+ LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference
+ https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/
+ Mon, 25 May 2015 00:00:00 +0000
+
+ https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/
+ <p>LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015.
The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.</p>
+<p>On the industry track, LDBC will be presenting the <em>Social Network Benchmark Interactive Workload</em> by Orri Erling (OpenLink Software), Alex Averbuch (Neo Technology), Josep Larriba-Pey (Sparsity Technologies), Hassan Chafi (Oracle Labs), Andrey Gubichev (TU Munich), Arnau Prat (Universitat Politècnica de Catalunya), Minh-Duc Pham (VU University Amsterdam) and Peter Boncz (CWI).</p>
+<p>You can read more about the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark here</a> and collaborate if you&rsquo;re interested!</p>
+<p>The other presentation will be at the GRADES workshop within the SIGMOD program regarding <em>Graphalytics: A Big Data Benchmark for Graph-Processing Platforms</em> by Mihai Capotă, Tim Hegeman, Alexandru Iosup (Delft University of Technology), Arnau Prat (Universitat Politècnica de Catalunya), Orri Erling (OpenLink Software) and Peter Boncz (CWI). We will provide more information about GRADES and this specific presentation in a following post, as GRADES is part of the events organized by LDBC.</p>
+<p>Don&rsquo;t forget to check our presentations if you&rsquo;re attending SIGMOD!</p>
+
+
+
+
+ SNB Interactive Part 1: What Is SNB Interactive Really About?
+ https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/
+ Thu, 14 May 2015 00:00:00 +0000
+
+ https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/
+ <p>This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. This is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of same.</p>
+<p>With two implementations of SNB Interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its performance characteristics are understood and even if these do not represent the maximum of the attainable, there are no glaring mistakes and the implementation represents a reasonable best effort by those who ought to know, namely the system vendors.</p>
+<p>The essence of a benchmark is a set of trick questions or choke points, as LDBC calls them. A number of these were planned from the start. It is then the role of experience to tell whether addressing these is really the key to winning the race. Unforeseen ones will also surface.</p>
+<p>So far, we see that SNB confronts the implementor with choices in the following areas:</p>
+<ul>
+<li>Data model: Relational, RDF, property graph?</li>
+<li>Physical model, e.g. row-wise vs. column-wise storage</li>
+<li>Materialized data ordering: Sorted projections, composite keys, replicating columns in auxiliary data structures</li>
+<li>Maintaining precomputed, materialized intermediate results, e.g. use of materialized views, triggers</li>
+<li>Query optimization: join order/type, interesting physical data orderings, late projection, top k, etc.</li>
+<li>Parameters vs.
literals: Sometimes different parameter values result in different optimal query plans</li>
+<li>Predictable, uniform latency: The measurement rules stipulate the SUT must not fall behind the simulated workload</li>
+<li>Durability - how to make data durable while maintaining steady throughput? Logging vs. checkpointing.</li>
+</ul>
+<p>In the process of making a benchmark implementation, one naturally encounters questions about the validity, reasonability and rationale of the benchmark definition itself. Additionally, even though the benchmark might not directly measure certain aspects of a system, making an implementation will take a system past its usual envelope and highlight some operational aspects.</p>
+<ul>
+<li>Data generation - Generating a mid-size dataset takes time, e.g. 8 hours for 300G. In a cloud situation, keeping the dataset in S3 or similar is necessary; re-generating it every time is not an option.</li>
+<li>Query mix - Are the relative frequencies of the operations reasonable? What bias does this introduce?</li>
+<li>Uniformity of parameters: Due to non-uniform data distributions in the dataset, there is easily a 100x difference between a &lsquo;fast&rsquo; and &lsquo;slow&rsquo; case of a single query template. How long does one need to run to balance these fluctuations?</li>
+<li>Working set: Experience shows that there is a large difference between an almost-warm and a steady-state working set. This can be a factor of 1.5 in throughput.</li>
+<li>Are the latency constraints reasonable? In the present case, a qualifying run must have under 5% of all query executions starting over 1 second late. Each execution is scheduled beforehand and done at the intended time. If the SUT does not keep up, it will have all available threads busy and must finish some work before accepting new work, so some queries will start late. Is this a good criterion for measuring consistency of response time? There are some obvious possibilities of abuse.</li>
+<li>Is the benchmark easy to implement/run? Perfection is open-ended and optimization possibilities infinite, albeit with diminishing returns. Still, getting started should not be too hard. Since systems will be highly diverse, testing that these in fact do the same thing is important. The SNB validation suite is good for this, and given publicly available reference implementations, the effort of getting started is not unreasonable.</li>
+<li>Since a qualifying run must meet latency constraints while going as fast as possible, setting the performance target involves trial and error. Does the tooling make this easy?</li>
+<li>Is the durability rule reasonable? Right now, one is not required to do checkpoints but must report the time to roll forward from the last checkpoint or initial state. Incenting vendors to build faster recovery is certainly good, but we are not through with all the implications.
What about redundant clusters?</li> +</ul> +<p>The following posts will look at the above in light of actual experience.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + Why Do We Need an LDBC SNB-Specific Workload Driver? + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + Tue, 21 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + <p>In a previous <a href="https://ldbcouncil.org/tags/driver">3-part blog series</a> we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn&rsquo;t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more traditional database benchmark workloads. Additionally, it will motivate why we chose to develop a new workload driver as part of this work, rather than using existing tooling that was developed in other database benchmarking efforts. To briefly recap, the task of the driver is to run a transactional database benchmark against large synthetic graph datasets - &ldquo;graph&rdquo; is the word that best captures the novelty and difficulty of this work.</p> +<p><strong>Workload Execution - Traditional vs Graph</strong></p> +<p>Transactional graph workloads differ from traditional relational workloads in several fundamental ways, one of them being the complex dependencies that exist between queries of a graph workload.</p> +<p>To understand what is meant by &ldquo;traditional relational workloads&rdquo;, take the classical TPC-C benchmark as an example. In TPC-C Remote Terminal Emulators (emulators) are used to issue update transactions in parallel, where the transactions issued by these emulators do not depend on one another. Note, &ldquo;dependency&rdquo; is used here in the context of scheduling, i.e., one query is dependent on another if it can not start until the other completes. For example, a New-Order transaction does not depend on other orders from this or other users. Naturally, the results of Stock-Level transactions depend on the items that were previously sold, but in TPC-C it is not an emulator&rsquo;s responsibility to enforce any such ordering. The scheduling strategy employed by TPC-C is tailored to the scenario where transactional updates do not depend on one another. In reality, one would expect to also have scheduling dependencies between transactions, e.g., checking the status of the order should only be done after the order is registered in the system. TPC-C, however, does not do this and instead only asks for the status of the last order <em>for a given user</em>. Furthermore, adding such dependencies to TPC-C would make scheduling only slightly more elaborate. 
Indeed, the Load Tester (LT) would need to make sure a New-Order transaction always precedes the read requests that check its status, but because users (and their orders) are partitioned across LTs, and orders belong to a particular user, this scheduling does not require inter-LT communication.</p> +<p>A significantly more difficult scheduling problem arises when we consider the SNB benchmark that models a real-world social network. Its domain includes users that form a social friendship graph and which leave posts/comments/likes on each others walls (forums). The update transactions are generated (exported as a log) by the data generator, with assigned timestamps, e.g. user 123 added post 456 to forum 789 at time T. Suppose we partition this workload by user, such that each driver gets all the updates (friendship requests, posts, comments and likes on other user&rsquo;s posts etc) initiated by a given user. Now, if the benchmark is to resemble a real-world social network, the update operations represent a highly connected (and dependent) network: a user should not create comments before she joins the network, a friendship request can not be sent to a non-existent user, a comment can only be added to a post that already exists, etc. Given a user partitioning scheme, most such dependencies would cross the boundaries between driver threads/processes, because the correct execution of update operations requires that the social network is in a particular state, and that state depends on the progress of other threads/processes.</p> +<p>Such scheduling dependencies in the SNB workload essentially replicate the underlying graph-like shape of its dataset. That is, every time a user comments on a friend&rsquo;s wall, for example, there is a dependency between two operations that is captured by an edge of the social graph. <em>Partitioning the workload among the LTs therefore becomes equivalent to graph partitioning, a known hard problem.</em></p> +<p><strong>Because it&rsquo;s a graph</strong></p> +<p>In short, unlike previous database benchmarking efforts, the SNB workload has necessitated a redefining of the state-of-the-art in workload execution. It is no longer sufficient to rely solely on workload partitioning to safely capture inter-query dependencies in complex database benchmark workloads. The graph-centric nature of SNB introduces new challenges, and novel mechanisms had to be developed to overcome these challenges. To the best of our knowledge, the LDBC SNB Interactive benchmark is the first benchmark that requires a non-trivial partitioning of the workload, among the benchmark drivers. In the context of workload execution, our contribution is therefore the principled design of a driver that executes dependent update operations in a performant and scalable way, across parallel/distributed LTs, while providing repeatable, vendor-independent execution of the benchmark.</p> + + + + + Event Driven Post Generation in Datagen + https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/ + Fri, 10 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/ + <p>As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain more in depth how this is actually implemented inside of the generator.</p> +<p>First of all, I start with a few basics of how Datagen works internally. 
In Datagen, once the person graph has been created (persons and their relationships), the activity generation starts. Persons are divided into blocks of 10k, in the same way they are during the friendship edge generation process. Then, for each person of the block, three types of forums are created:</p> +<ul> +<li> +<p>The wall of the person</p> +</li> +<li> +<p>The albums of the person</p> +</li> +<li> +<p>The groups where the person is a moderator</p> +</li> +</ul> +<p>We will focus on group generation, but the same concepts apply to the other types of forums. Once a group is created, the members of the group are selected, either from the friends of the moderator or from random persons within the same block.</p> +<p>After assigning the members to the group, the post generation starts. We have two types of post generators, the uniform post generator and the event based post generator. Each post generator is responsible for generating, given a forum, a set of posts whose authors are taken from the set of members of the forum. The uniform post generator distributes the dates of the generated posts uniformly along the time line (from the date of the membership until the end of the simulation time). The event based post generator, on the other hand, assigns dates to posts based on what we call “flashmob events”.</p> +<p>Flashmob events are generated at the beginning of the execution. Their number is set by a configuration parameter, which defaults to 30 events per month of simulation, and the time of each event is distributed uniformly along the time line. Each event is also assigned a volume level (between 1 and 20) following a power law distribution, which determines how relevant or important the event is, and a tag representing the concept or topic of the event. Two different events can have the same tag. For example, one of the flashmob events created for SF1 is related to the &ldquo;Enrique Iglesias&rdquo; tag, has level 11 and occurs on the 29th of May 2012 at 09:33:47.</p> +<p>Once the event based post generation starts for a given group, a subset of the generated flashmob events is extracted. These events must be correlated with the tag/topic of the group, and the set of selected events is restricted by the creation date of the group (in a group one cannot talk about an event prior to the creation of the group). Given this subset of events and their volume levels, a cumulative probability distribution (using the events sorted by event date and their level) is computed, which is later used to determine which event a given post is associated with. Therefore, events with a larger level have a higher probability of receiving posts, making their volume larger. Post generation then proceeds as follows:</p> +<ul> +<li> +<p>Determine the number of posts to generate</p> +</li> +<li> +<p>Select a random member of the group that will generate the post</p> +</li> +<li> +<p>Determine the event the post will be related to, using the aforementioned cumulative distribution (see the sketch below)</p> +</li> +<li> +<p>Assign the date of the post based on the event date</p> +</li> +</ul> +<p>In order to assign the date of the post, based on the date of the event the post is assigned to, we use a probability density which has been extracted from <a href="#references">[1]</a> and is described below.</p>
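+<p>Before looking at that density, the event-selection step (the third bullet above) can be illustrated with a small sketch. The names below are hypothetical and the code is a simplification, not the actual Datagen implementation: events correlated with the group are weighted by their volume level, and one of them is drawn from the resulting cumulative distribution.</p>
+<pre tabindex="0"><code>// Simplified sketch (hypothetical names): pick the flashmob event a post is
+// attached to, weighting the candidate events by their volume level.
+class FlashmobEvent {
+    long date;   // time stamp of the event in the simulation time line
+    int level;   // volume level between 1 and 20, power-law distributed
+}
+
+class EventSelection {
+    // candidates: events correlated with the group topic, later than the group creation date
+    static FlashmobEvent pickEvent(FlashmobEvent[] candidates, java.util.Random random) {
+        if (candidates.length == 0) {
+            return null;
+        }
+        double[] cumulative = new double[candidates.length];
+        double total = 0.0;
+        for (int i = 0; i &lt; candidates.length; i++) {
+            total += candidates[i].level;   // a larger level means a larger share of the posts
+            cumulative[i] = total;
+        }
+        double sample = random.nextDouble() * total;
+        for (int i = 0; i &lt; candidates.length; i++) {
+            if (sample &lt;= cumulative[i]) {
+                return candidates[i];
+            }
+        }
+        return candidates[candidates.length - 1];
+    }
+}
+</code></pre>
+<p>The date of the post is then drawn around the date of the selected event, using the probability density discussed next.</p>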
+<p>The shape of the probability density is a combination of an exponential function in the 8 hour interval around the peak, while the volume outside this interval follows a logarithmic function. The following figure shows the actual shape of the volume, centered at the date of the event.</p> +<p><img src="index.png" alt=""></p> +<p>Following the example of &ldquo;Enrique Iglesias&rdquo;, the following figure shows the activity volume of posts around the event as generated by Datagen.</p> +<p><img src="index2.png" alt=""></p> +<p>In this blog entry we have seen how Datagen creates event driven user activity. This allows us to reproduce the heterogeneous post creation density found in a real social network, where post creation is driven by real world events.</p> +<h4 id="references">References</h4> +<p>[1] Jure Leskovec, Lars Backstrom, Jon M. Kleinberg: Meme-tracking and the dynamics of the news cycle. KDD 2009: 497-506</p> + + + + + Sixth TUC Meeting + https://ldbcouncil.org/event/sixth-tuc-meeting/ + Thu, 19 Mar 2015 13:53:33 -0400 + + https://ldbcouncil.org/event/sixth-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Sixth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at Universitat Politècnica de Catalunya, Barcelona on <strong>Thursday and Friday March 19/20, 2015.</strong></p> +<p>The LDBC FP7 EC funded project is reaching its finalisation, and this will be the last event sponsored directly by the project. However, tasks within LDBC will continue based on the LDBC independent organisation. The event will cover the following aspects:</p> +<ul> +<li>Two day event with one day devoted to users&rsquo; experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the first benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the officials of the new LDBC organisation.</li> +<li>Pre-event with the 3rd Graph-TA workshop organised on March 18th at the same premises, with a lot of interaction and interesting research presentations.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>.</p> +<h3 id="agenda">Agenda</h3> +<p><strong>Thursday 19th March</strong></p> +<p>11:00 - 11:30 Registration, coffee break and welcome (Josep Larriba Pey)</p> +<p>11:30 - 12:00 LDBC introduction and status update (Peter Boncz) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981131.pdf">slides</a></p> +<p>12:00 - 13:30 Technology and benchmarking (chair: Peter Boncz)</p> +<p>12:00 Venelin Kotsev (Ontotext). Semantic Publishing Benchmark v2.0. – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981137.pdf">slides</a></p> +<p>12:30 Nina Saveta (FORTH). SPIMBENCH: A Scalable, Schema-Aware, Instance Matching Benchmark for the Semantic Publishing Domain</p> +<p>12:50 Tomer Sagi (HP). 
Titan DB on LDBC SNB Interactive</p> +<p>13:10 Claudio Martella (VUA): Giraph and Lighthouse</p> +<p>13:30 - 14:30 Lunch break</p> +<p>14:30 - 16:00 Applications and use of Graph Technologies (chair: Hassan Chafi)</p> +<p>14:30 Jerven Bolleman (Swiss Institute of Bioinformatics): 20 billion triples in production <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981132.pdf">slides</a></p> +<p>14:50 Mark Wilkinson (Universidad Politécnica de Madrid): Design principles for Linked-Data-native Semantic Web Services <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981133.pdf">slides</a></p> +<p>15:10 Peter Haase (Metaphacts, Systap LLC): Querying the Wikidata Knowledge Graph <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981139.pdf">slides</a></p> +<p>15:30 Esteban Sota (GNOSS): Human Interaction with Faceted Searching Systems for big or complex graphs</p> +<p>18:30 - 20:00 Cultural visit Barcelona city center. Meet at Plaça Catalunya.</p> +<p>20:00 Social dinner at <a href="http://www.bastaix.com">Bastaix Restaurant</a>.</p> +<p><strong>Friday 20th March</strong></p> +<p>9:30 - 11:00 Technology and Benchmarking (chair: Josep L. Larriba-Pey)</p> +<p>9:30 Yinglong Xia (IBM): Towards Temporal Graph Management and Analytics</p> +<p>9:50 Alexandru Iosup (TU Delft). Graphalytics: A big data benchmark for graph-processing platforms</p> +<p>10:10 John Snelson (MarkLogic): Introduction to MarkLogic</p> +<p>10:30 Arnau Prat (UPC-Sparsity Technologies) and Alex Averbuch (Neo): Social Network Benchmark, Interactive Workload</p> +<p>10:50 Moritz Kaufmann. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/moritz-kaufmann-ldbc-snb-benchmark-auditing-6th-ldbc-tuc.pdf">The auditing experience</a></p> +<p>11:15 - 11:45 Coffee break</p> +<p>11:45 - 12:45 Applications and use of Graph Technologies (chair: Atanas Kiryakov)</p> +<p>11:45 Boris Motik (Oxford University): Parallel and Incremental Materialisation of RDF/Datalog in RDFox</p> +<p>12:05 Andreas Both (Unister): E-Commerce and Graph-driven Applications: Experiences and Optimizations while moving to Linked Data</p> +<p>12:25 Smrati Gupta (CA Technologies). Modaclouds Decision Support System in multicloud environments</p> +<p>12:45 Peter Boncz. Conclusions for the LDBC project and future perspectives. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981138.pdf">slides</a></p> +<p>13:30 - 14:30 Lunch break</p> +<p>15:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>19th and 20th March 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held at &ldquo;Aula Master&rdquo; at A3 building located inside the &ldquo;Campus Nord UPC&rdquo; in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h5 id="maps-and-situation"><strong>Maps and situation</strong></h5> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<h5 id="finding-upc"><strong>Finding UPC</strong></h5> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<h5 id="finding-the-meeting-room"><strong>Finding the meeting room</strong></h5> +<h5 id="getting-there">Getting there</h5> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to<br> +the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €20 and trips to other destinations in the city cost approximately €25-30.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. 
You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<h5 id="the-locations-of-the-airport-and-the-city-centre"><strong>The locations of the airport and the city centre</strong></h5> + + + + + The LDBC Datagen Community Structure + https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/ + Sun, 15 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/ + <p>This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.</p> +<p>When generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other more qualitative characteristics such as the degree distribution or the clustering coefficient. Real graphs, and especially social networks, typically have highly skewed degree distributions with a long tail, a moderately large clustering coefficient and an appreciable community structure.</p> +<p>The first two characteristics are deliberately modeled in DATAGEN. DATAGEN generates persons with a degree distribution that matches that observed in Facebook, and thanks to the attribute correlated edge generation process, we obtain graphs with a moderately large clustering coefficient. But what about the community structure of graphs generated with DATAGEN? The answer can be found in the paper titled “How community-like is the structure of synthetically generated graphs”, which was published in GRADES 2014 <a href="#references">[1]</a>. Here we summarize the paper and its contributions and findings.</p> +<p>Existing synthetic graph generators such as Rmat <a href="#references">[1]</a> and Mag <a href="#references">[2]</a> are designed to produce graphs with long tailed distributions and a large clustering coefficient, but they completely ignore the fact that real graphs are structured into communities. For this reason, Lancichinetti et al. proposed LFR <a href="#references">[3]</a>, a graph generator that not only produces graphs with realistic high level characteristics, but also enforces an appreciable community structure. This generator has become the de facto standard for benchmarking community detection algorithms, as it outputs not only a graph but also the communities present in that graph, hence it can be used to test the quality of a community detection algorithm.</p> +<p>However, no one had studied whether the community structure produced by LFR was in fact realistic compared to real graphs. Even though the communities in LFR exhibit interesting properties, such as the expected larger internal density than external density, or a long-tailed distribution of community sizes, they lack the noise and inhomogeneities present in a real graph. More importantly, how does the community structure of DATAGEN compare to that exhibited in LFR and real graphs? Is it more or less realistic? The authors of <a href="#references">[1]</a> set up an experiment where they analyzed the characteristics of the communities output by LFR, and the groups (groups of people interested in a given topic) output by DATAGEN, and compared them to a set of real graphs with metadata. 
These real graphs, which can be downloaded from the Snap project website, are graphs that have recently become very popular in the field of community detection, as they contain ground truth communities extracted from their metadata. The ground truth graphs used in this experiment are shown in the following table. For more details about how this ground truth is generated, please refer to <a href="#references">[4]</a>.</p> +<table> +<thead> +<tr> +<th></th> +<th><em>Nodes</em></th> +<th><em>Edges</em></th> +</tr> +</thead> +<tbody> +<tr> +<td><em>Amazon</em></td> +<td>334863</td> +<td>925872</td> +</tr> +<tr> +<td><em>Dblp</em></td> +<td>317080</td> +<td>1049866</td> +</tr> +<tr> +<td><em>Youtube</em></td> +<td>1134890</td> +<td>2987624</td> +</tr> +<tr> +<td><em>Livejournal</em></td> +<td>3997962</td> +<td>34681189</td> +</tr> +</tbody> +</table> +<p>The authors of <a href="#references">[1]</a> selected a set of statistical indicators to<br> +characterize the communities:</p> +<ul> +<li>The clustering coefficient</li> +<li>The triangle participation ratio (TPR), which is the ratio of nodes that close at least one triangle in the community.</li> +<li>The bridge ratio, which is the ratio of edges whose removal disconnects the community.</li> +<li>The diameter</li> +<li>The conductance</li> +<li>The size</li> +</ul> +<p>The authors start by analyzing each community of the ground truth graphs using the above statistical indicators and plotting the distributions of each of them. The following are the plots of the Livejournal graph. We summarize the findings of the authors regarding real graphs:</p> +<ul> +<li>Several indicators (Clustering Coefficient, TPR and Bridge ratio) exhibit a multimodal distribution, with two peaks at their extremes.</li> +<li>Many of the communities (44%) have a small clustering coefficient between 0 and 0.01. Out of them, 56% have just three vertices. On the other hand, 11% of the communities have a clustering coefficient between 0.99 and 1.0. In between, communities exhibit different values of clustering coefficients. This trend is also observed for TPR and Bridge ratio. This suggests that communities cannot be modeled using a single model.</li>
+<li>84% of the communities have a diameter smaller than five, suggesting that ground truth communities are small and compact.</li> +<li>Ground truth communities are not very isolated; they have a lot of connections pointing outside of the community.</li> +<li>Most of the communities are small (10 or fewer nodes).</li> +<li>In general, ground truth communities are small, with a low diameter, not isolated and with different ranges of internal connectivity.</li> +</ul> +<table> +<thead> +<tr> +<th style="text-align:center"></th> +<th style="text-align:center"></th> +</tr> +</thead> +<tbody> +<tr> +<td style="text-align:center"><img src="index.png" alt=""></td> +<td style="text-align:center"><img src="index2.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Clustering Coefficient</td> +<td style="text-align:center">TPR</td> +</tr> +<tr> +<td style="text-align:center"><img src="index3.png" alt=""></td> +<td style="text-align:center"><img src="index4.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Bridge Ratio</td> +<td style="text-align:center">Diameter</td> +</tr> +<tr> +<td style="text-align:center"><img src="index5.png" alt=""></td> +<td style="text-align:center"><img src="index6.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Conductance</td> +<td style="text-align:center">Size</td> +</tr> +</tbody> +</table> +<p>The authors performed the same experiment but for DATAGEN and LFR graphs. They generated a graph of 150k nodes, using their default parameters. In the case of LFR, they tested five different values of the mixing factor, which specifies the ratio of edges of a community pointing outside of the community; they ranged this value from 0 to 0.5. The following are the distributions for DATAGEN.</p> +<table> +<thead> +<tr> +<th style="text-align:center"></th> +<th style="text-align:center"></th> +</tr> +</thead> +<tbody> +<tr> +<td style="text-align:center"><img src="index8.png" alt=""></td> +<td style="text-align:center"><img src="index9.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Clustering Coefficient</td> +<td style="text-align:center">TPR</td> +</tr> +<tr> +<td style="text-align:center"><img src="index10.png" alt=""></td> +<td style="text-align:center"><img src="index11.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Bridge Ratio</td> +<td style="text-align:center">Diameter</td> +</tr> +<tr> +<td style="text-align:center"><img src="index11.png" alt=""></td> +<td style="text-align:center"><img src="index12.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Conductance</td> +<td style="text-align:center">Size</td> +</tr> +</tbody> +</table> +<p>The main conclusions that can be extracted from DATAGEN can be summarized as follows:</p> +<ul> +<li>DATAGEN is able to reproduce the multimodal distribution observed for clustering coefficient, TPR and bridge ratio.</li> +<li>The central part of the clustering coefficient distribution is biased towards the left, in a similar way as observed for the Youtube and Livejournal graphs.</li> +<li>Like in real graphs, communities in DATAGEN graphs are not isolated, but their level of isolation is significantly larger.</li> +<li>The diameter is small, like in the real graphs.</li> +<li>It is significant that communities in DATAGEN graphs are closer to those observed in Youtube and Livejournal, as these are social networks like the graphs produced by DATAGEN. 
We see that DATAGEN is able to reproduce many of their characteristics.</li> +</ul> +<p>Finally, the authors repeat the same experiment for LFR graphs. The following are the plots for the LFR graph with mixing ratio 0.3. From them, the authors extract the following conclusions:</p> +<ul> +<li>LFR graphs do not show the multimodal distribution observed in real graphs.</li> +<li>Only the diameter shows a similar shape as in the ground truth.</li> +</ul> +<table> +<thead> +<tr> +<th style="text-align:center"></th> +<th style="text-align:center"></th> +</tr> +</thead> +<tbody> +<tr> +<td style="text-align:center"><img src="index13.png" alt=""></td> +<td style="text-align:center"><img src="index14.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Clustering Coefficient</td> +<td style="text-align:center">TPR</td> +</tr> +<tr> +<td style="text-align:center"><img src="index15.png" alt=""></td> +<td style="text-align:center"><img src="index16.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Bridge Ratio</td> +<td style="text-align:center">Diameter</td> +</tr> +<tr> +<td style="text-align:center"><img src="index17.png" alt=""></td> +<td style="text-align:center"><img src="index18.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Conductance</td> +<td style="text-align:center">Size</td> +</tr> +</tbody> +</table> +<p>To better quantify how similar the distributions of the different graphs are, the authors also show the correlograms for each of the statistical indicators. These correlograms contain the Spearman&rsquo;s correlation coefficient between each pair of graphs for a given statistical indicator. The bluer the color, the better the correlation. We see that the DATAGEN distributions correlate very well with those observed in real graphs, especially, as we commented above, with Youtube and Livejournal. On the other hand, LFR only succeeds significantly in the case of the diameter.</p> +<table> +<thead> +<tr> +<th style="text-align:center"></th> +<th style="text-align:center"></th> +</tr> +</thead> +<tbody> +<tr> +<td style="text-align:center"><img src="index19.png" alt=""></td> +<td style="text-align:center"><img src="index20.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Clustering Coefficient</td> +<td style="text-align:center">TPR</td> +</tr> +<tr> +<td style="text-align:center"><img src="index21.png" alt=""></td> +<td style="text-align:center"><img src="index22.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Bridge Ratio</td> +<td style="text-align:center">Diameter</td> +</tr> +<tr> +<td style="text-align:center"><img src="index23.png" alt=""></td> +<td style="text-align:center"><img src="index24.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Conductance</td> +<td style="text-align:center">Size</td> +</tr> +</tbody> +</table> +<p>We see that DATAGEN is able to reproduce a realistic community structure, compared to existing graph generators. This feature could potentially be exploited to define new benchmarks to measure the quality of novel community detection algorithms. Stay tuned for future blog posts about this topic!</p> +<h4 id="references">References</h4> +<p>[1] Arnau Prat-Pérez, <a href="http://dblp.uni-trier.de/pers/hd/d/Dom=iacute=nguez=Sal:David">David Domínguez-Sal</a>: How community-like is the structure of synthetically generated graphs? 
<a href="http://dblp.uni-trier.de/db/conf/sigmod/grades2014.html#PratD14">GRADES 2014</a></p> +<p>[2] Deepayan Chakrabarti, Yiping Zhan, and Christos Faloutsos: R-MAT: A recursive model for graph mining. SIAM SDM 2004</p> +<p>[3] Myunghwan Kim and Jure Leskovec: Multiplicative attribute graph model of real-world networks. Internet Mathematics</p> +<p>[4] Andrea Lancichinetti, Santo Fortunato, and Filippo Radicchi: Benchmark graphs for testing community detection algorithms. Physical Review E 2008.</p> + + + + + Industry Relevance of the Semantic Publishing Benchmark + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + Tue, 03 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + <h3 id="publishing-and-media-businesses-are-going-through-transformation">Publishing and media businesses are going through transformation</h3> +<p>I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and wrestling my jetlag in front of the Hilton. In the lobby inside, SemTech 2010 conference attendees were watching a game from the FIFA World Cup in South Africa. In the picture, the self-service newspaper stand is empty, except for one free paper. Not long ago, in the year 2000, this stand was full. Back then people in the Bay Area were willing to pay for printed newspapers. But this is no longer true.</p> +<p>What’s driving this change in publishing and media?</p> +<ul> +<li> +<p>Widespread and instantaneous distribution of information over the Internet has turned news into somewhat of a &ldquo;commodity&rdquo;, and few people are willing to pay for it;</p> +</li> +<li> +<p>The wealth of free content on YouTube and similar services spoiled the comfort of many mainstream broadcasters;</p> +</li> +<li> +<p>Open access publishing has limited academic publishers’ ability to sell journals and books at prices that were considered fair ten years ago.</p> +</li> +</ul> +<p><em>Alongside other changes in the industry, publishers figured out that it is critical to add value through better authoring, promotion, discoverability, delivery and presentation of precious content.</em></p> +<h3 id="imagine-instant-news-in-context-imagine-personal-channels-imagine--triplestores">Imagine instant news in context, Imagine personal channels, Imagine &hellip; triplestores</h3> +<p>While plain news can be created repeatedly, premium content and services are not as easy to create. Think of an article that not only tells the new facts, but refers back to previous events and is complemented by an info-box of relevant facts. It allows one to interpret and comprehend news more effectively. This is the well-known journalistic aim to put news in context. It is also well known that producing such news in &ldquo;near real time&rdquo; is difficult and expensive using legacy processes and content management technology.</p> +<p>Another example would be a news feed that delivers good coverage of information relevant to a narrow subject – for example a company, a story line or a region. Judging by the demand for intelligent press clipping services like <a href="http://new.dowjones.com/products/factiva/">Factiva</a>, such channels are in demand but are not straightforward to produce with today’s technology. 
Despite the common perception that automated recommendations for related content and personalized news are technology no-brainers, suggesting truly relevant content is far from trivial.</p> +<p>Finally, to use an example from the life sciences, the ability to quickly find scientific articles discussing asthma and x-rays, while searching for respiration disorders and radiation, requires a search service that is not easy to deliver.</p> +<p>Many publishers have been pressed to advance their business. This, in turn, has led to a quest to innovate. And semantic technology can help publishers in two fundamental ways:</p> +<ol> +<li>Generation of rich and &ldquo;meaningful&rdquo; (trying not to use &ldquo;semantic&rdquo; :-) metadata descriptions;</li> +<li>Dynamic retrieval of content, based on this rich metadata, enabling better delivery.</li> +</ol> +<p>In this post I write about &ldquo;semantic annotation&rdquo; and how it enables application scenarios like BBC’s Dynamic Semantic Publishing (DSP). I will also present the business case behind DSP. The final part of the post is about triplestores – the semantic graph database engines used in DSP. To be more concrete, I write about the Semantic Publishing Benchmark (SPB), which evaluates the performance of triplestores in DSP scenarios.</p> +<h3 id="semantic-annotation-produces-rich-metadata-descriptions--the-fuel-for-semantic-publishing">Semantic Annotation produces Rich Metadata Descriptions – the fuel for semantic publishing</h3> +<p>The most popular meaning of &ldquo;semantic annotation&rdquo; is the process of enriching text with links to (descriptions of) concepts and entities mentioned in the text. This usually means tagging either the entire document or specific parts of it with identifiers of entities. These identifiers allow one to retrieve descriptions of the entities and their relations to other entities – additional structured information that fuels better search and presentation.</p> +<p><img src="02_semantic_repository.png" alt=""></p> +<p>The concept of using <a href="http://infosys3.elfak.ni.ac.rs/nastava/attach/SemantickiWebKurs/sdarticle.pdf">text-mining for automatic semantic annotation</a> of text with respect to very large datasets, such as <a href="http://dbpedia.org/">DBPedia</a>, emerged in the early 2000s. In practical terms it means using such large datasets as a sort of gigantic gazetteer (name lookup tool), together with the ability to disambiguate. Figuring out whether &ldquo;Paris&rdquo; in the text refers to the capital of France, to Paris, Texas, or to Paris Hilton is crucial in such a context. Sometimes this is massively difficult – try to instruct a computer how to guess whether &ldquo;Hilton&rdquo; in the second sentence of this post refers to a hotel from the chain founded by her grandfather or that I had the chance to meet Paris Hilton in person on the street in San Francisco.</p> +<p>Today there are plenty of tools (such as the <a href="https://www.ontotext.com/semantic-solutions/media-publishing/">Ontotext Media and Publishing</a> platform and <a href="https://github.com/dbpedia-spotlight/dbpedia-spotlight/wiki">DBPedia Spotlight</a>) and services (such as Thomson Reuters’ <a href="http://www.opencalais.com/">OpenCalais</a> and Ontotext’s <a href="http://s4.ontotext.com">S4</a>) that offer automatic semantic annotation. Although text-mining cannot deliver 100% correct annotations, there are plenty of scenarios where technology like this would revolutionize a business. 
This is the case with the Dynamic Semantic Publishing scenario described below.</p> +<h3 id="the-bbcs-dynamic-semantic-publishing-dsp">The BBC’s Dynamic Semantic Publishing (DSP)</h3> +<p>Dynamic Semantic Publishing is a model for using semantic technology in media developed by a group led by John O’Donovan and Jem Rayfield at the BBC. The implementation of DSP behind BBC’s FIFA World Cup 2010 website was the first high-profile success story for usage of semantic technology in media. It is also the basis for the SPB benchmark – sufficient reasons to introduce this use case at length below.</p> +<p>BBC Future Media &amp; Technology department have transformed the BBC relational content management model and static publishing framework to a fully dynamic semantic publishing architecture. With minimal journalistic management, media assets are being enriched with links to concepts, semantically described in a triplestore. This novel semantic approach provides improved navigation, content re-use and re-purposing through automatic aggregation and rendering of links to relevant stories. At the end of the day DSP improves the user experience on BBC’s web site.</p> +<p><em>&ldquo;A high-performance dynamic semantic publishing framework facilitates the publication of automated metadata-driven web pages that are light-touch, requiring minimal journalistic management, as they automatically aggregate and render links to relevant stories&rdquo;.</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">Jem Rayfield, Senior Technical Architect</a>, BBC News and Knowledge</p> +<p>The Dynamic Semantic Publishing (DSP) architecture of the BBC curates and publishes content (e.g. articles or images) based on embedded Linked Data identifiers, ontologies and associated inference. It allows for journalists to determine levels of automation (&ldquo;edited by exception&rdquo;) and support semantic advertisement placement for audiences outside of the UK. The following quote explains the workflow when a new article gets into BBC’s content management system.</p> +<p><em>&ldquo;In addition to the manual selective tagging process, journalist-authored content is automatically analysed against the World Cup ontology. A <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#language">natural language and ontological determiner process</a> automatically extracts World Cup concepts embedded within a textual representation of a story. The concepts are moderated and, again, selectively applied before publication. Moderated, automated concept analysis improves the depth, breadth and quality of metadata publishing.</em></p> +<p><img src="03_bbc_sport.png" alt=""></p> +<p><em>Journalist-published metadata is captured and made persistent for querying using the resource description framework (<a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#RDF"><em>RDF</em></a>) metadata representation and triple store technology. <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#BigOWLIM">A RDF triplestore</a> and <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#SPARQL">SPARQL</a> approach was chosen over and above traditional relational database technologies due to the requirements for interpretation of metadata with respect to an ontological domain model. 
The high level goal is that the domain ontology allows for intelligent mapping of journalist assets to concepts and queries. The chosen triplestore provides reasoning following the forward-chaining model and thus implied inferred statements are automatically derived from the explicitly applied journalist metadata concepts. For example, if a journalist selects and applies the single concept &ldquo;Frank Lampard&rdquo;, then the framework infers and applies concepts such as &ldquo;England Squad&rdquo;, &ldquo;Group C&rdquo; and &ldquo;FIFA World Cup 2010&rdquo; &hellip;&rdquo;</em> &ndash; Jem Rayfield</p> +<p>One can consider each of the &ldquo;aggregation pages&rdquo; of BBC as a sort of feed or channel serving content related to a specific topic. If you take this perspective, with its World Cup 2010 website BBC was able to provide more than 700 thematic channels.</p> +<p><em>&ldquo;The World Cup site is a large site with over 700 aggregation pages (called index pages) designed to lead you on to the thousands of story pages and content</em></p> +<p><strong>…</strong><strong><em>we are not publishing pages, but publishing content</em></strong> <em>as assets which are then organized by the metadata dynamically into pages, but could be re-organized into any format we want much more easily than we could before.</em></p> +<p><img src="04_content_tagging.png" alt=""></p> +<p><em>… The index pages are published automatically. This process is what assures us of the highest quality output, but still <strong>save large amounts of time</strong> in managing the site and <strong>makes it possible for us to efficiently run so many pages</strong> for the World Cup.&rdquo;</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/the_world_cup_and_a_call_to_ac.html">John O&rsquo;Donovan, Chief Technical Architect, BBC Future Media &amp; Technology</a></p> +<p>To get a real feeling about the load of the triplestore behind BBC&rsquo;s World Cup web site, here are some statistics:</p> +<ul> +<li> +<p>800+ aggregation pages (Player, Team, Group, etc.), generated through SPARQL queries;</p> +</li> +<li> +<p>Average unique page requests/day: 2 million;</p> +</li> +<li> +<p>Average <strong>SPARQL queries/day: 1 million;</strong></p> +</li> +<li> +<p><strong>100s repository updates/inserts per minute</strong> with OWL 2 RL reasoning;</p> +</li> +<li> +<p>Multi data center that is fully resilient, clustered 6 node triplestore.</p> +</li> +</ul> +<h3 id="the-semantic-publishing-benchmark">The Semantic Publishing Benchmark</h3> +<p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the BBC Dynamic Semantic Publishing scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volumes of read requests (SPARQL queries collecting recent content and data to generate web pages on a specific subject, e.g. Frank Lampard).</p> +<p>SPB simulates a setup for media that deals with large volumes of streaming content, e.g. articles, pictures, videos. This content is being enriched with metadata that describes it through links to reference knowledge:</p> +<ul> +<li> +<p><em>Reference knowledge:</em> taxonomies and databases that include relevant concepts, entities and factual information (e.g. 
sport statistics);</p> +</li> +<li> +<p><em>Metadata</em> for each individual piece of content allows publishers to efficiently produce live streams of content relevant to specific subjects.</p> +</li> +</ul> +<p>In this scenario the triplestore holds both reference knowledge and metadata. The main interactions with the repository are of two types:</p> +<ul> +<li> +<p><em>Aggregation queries</em> retrieve content according to various criteria. There are two sets (mixes) of aggregation queries. The basic one includes interactive queries that involve retrieval of concrete pieces of content, as well as aggregation functions, geo-spatial and full-text search constraints. The analytical query mix includes analytical queries, faceted search and drill-down queries;</p> +</li> +<li> +<p><em>Updates</em>, adding new metadata or updating the reference knowledge. It is important that such updates should immediately impact the results of the aggregation queries. Imagine a fan checking the page for Frank Lampard right after he scored a goal – she will be very disappointed to see out of date statistics there.</p> +</li> +</ul> +<p>SPB v.1.0 directly reproduces the DSP setup at the BBC. The reference dataset consists of BBC Ontologies (Core, Sport, News), BBC datasets (list of F1 teams, MPs, etc.) and an excerpt from <a href="http://www.geonames.org/">Geonames</a> for the UK. The benchmark is packed with metadata generator that allows one to set up experiments at different scales. The metadata generator produces 19 statements per Creative Work (BBC’s slang for all sorts of media assets). The standard scale factor is 50 million statements.</p> +<p>A more technical introduction to SPB can be found in this <a href="https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark">post</a>. Results from experiments with SPB on different hardware configurations, including AWS instances, are available in this <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">post</a>. An interesting discovery is that given the current state of the technology (particularly the GraphDB v.6.1 engine) and today’s cloud infrastructure, the load of BBC’s World Cup 2010 website can be handled at AWS by a cluster that costs only $81/day.</p> +<p>Despite the fact that SPB v.1.0 follows closely the usage scenario for triplestores in BBC’s DSP incarnations, it is relevant to a wide range of media and publishing scenarios, where large volumes of &ldquo;fast flowing&rdquo; content need to be &ldquo;dispatched&rdquo; to serve various information needs of a huge number of consumers. The main challenges can be summarized as follows:</p> +<ul> +<li> +<p>The Triplestore is used as operational database serving a massive number of read queries (hundreds of queries per second) in parallel with tens of update transactions per second. Transactions need to be handled instantly and in a reliable and consistent manner;</p> +</li> +<li> +<p>Reasoning is needed to map content descriptions to queries in a flexible manner;</p> +</li> +<li> +<p>There are specific requirements, such as efficient handling of full-text search, geo-spatial and temporal constraints.</p> +</li> +</ul> +<h3 id="spb-v20--steeper-for-the-engines-closer-to-the-publishers">SPB v.2.0 – steeper for the engines, closer to the publishers</h3> +<p>We are in the final testing of the new version 2.0 of SPB. 
The benchmark has evolved to allow for retrieval of semantically relevant content in a more advanced manner and at the same time to demonstrate how triplestores can offer simplified and more efficient querying.</p> +<p>The major changes in SPB v.2.0 can be summarized as follows:</p> +<ul> +<li> +<p>Much bigger reference dataset: from 170 thousand to 22 million statements. Now it includes GeoNames data about all of Europe (around 7 million statements) and DBPedia data about companies, people and events (14 million statements). This way we can simulate media archives described against datasets with good global coverage for specific types of objects. Such large reference sets also provide a better testing ground for experiments with very large content archives – think of 50 million documents (1 billion statements) or more;</p> +</li> +<li> +<p>Better interconnected reference data: more than 5 million links between entities, including 500,000 owl:sameAs links between DBPedia and Geonames descriptions. The latter evaluates the capabilities of the engine to deal with data coming from multiple sources, which use different identifiers for one and the same entity;</p> +</li> +<li> +<p>Retrieval of relevant content through links in the reference data, including inferred ones. To this end it is important than SPB v.2.0 involves much more comprehensive inference, particularly with respect to transitive closure of parent-company and geographic nesting chains.</p> +</li> +</ul> + + + + + OWL-Empowered SPARQL Query Optimization + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + Wed, 18 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + <p>The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution plans for a given query.</p> +<p>In this post, we propose a different approach to query optimization, which is meant to complement (rather than replace) the standard optimization methodologies for SPARQL queries. Our approach is based on the use of schema information, encoded using OWL constructs, which often accompany Linked Data.</p> +<p>OWL adopts the Open World Assumption and hence OWL axioms are perceived primarily to infer new knowledge. Nevertheless, ontology designers consider OWL as an expressive schema language used to express constraints for validating the datasets, hence following the Closed World Assumption when interpreting OWL ontologies. Such constraints include disjointness/equivalence of classes/properties, cardinality constraints, domain and range restrictions for properties and others.</p> +<p>This richness of information carried over by OWL axioms can be the basis for the development of schema-aware techniques that will allow significant improvements in the performance of existing RDF query engines when used in tandem with data statistics or even other heuristics based on patterns found in SPARQL queries. 
As a simple example, a cardinality constraint at the schema level can provide a hint on the proper join ordering, even if data statistics are missing or incomplete.</p> +<p>The aim of this post is to show that the richness of information carried over by OWL axioms under the Closed World Assumption can be the basis for the development of schema-aware optimization techniques that will allow considerable improvements in query processing. To attain this objective, we discuss a small set of interesting cases of OWL axioms; a full list can be found <a href="LDBC_D4.4.2_final.pdf">here</a>.</p> +<h3 id="schema-based-optimization-techniques">Schema-Based Optimization Techniques</h3> +<p>Here we provide some examples of queries which, when combined with specific schema constraints expressed in OWL, can help the optimizer formulate (near-)optimal query plans.</p> +<p>A simple first case is that of constraint violation. Consider the query below, which returns all instances of class <code>&lt;A&gt;</code> which are fillers of a specific property <code>&lt;P&gt;</code>. If the underlying schema contains the information that the range of <code>&lt;P&gt;</code> is class <code>&lt;B&gt;</code>, and that class <code>&lt;B&gt;</code> is disjoint from class <code>&lt;A&gt;</code>, then this query should return the empty result, with no further evaluation (assuming that the constraints associated with the schema are satisfied by the data). An optimizer that takes into account schema information should return an empty result in constant time instead of trying to optimize or evaluate the large star join.</p> +<pre tabindex="0"><code>SELECT ?v +WHERE { ?v rdf:type &lt;A&gt; . + ?u &lt;P&gt; ?v . ?u &lt;P&gt; ?v1 . + ?u &lt;P1&gt; ?v2 . ?u &lt;P2&gt; ?v3 . + ?u &lt;P3&gt; ?v4 . ?u &lt;P4&gt; ?v5 } +</code></pre><p>Schema-aware optimizers could also prune the search space by eliminating results that are known a priori not to be in the answer set of a query. The query above is an extreme such example (where all potential results are pruned), but other cases are possible, such as the query below, where all subclasses of class <code>&lt;A1&gt;</code> can immediately be identified as not being in the answer set.</p> +<pre tabindex="0"><code>SELECT ?c +WHERE { ?x rdf:type ?c . ?x &lt;P&gt; ?y . + FILTER NOT EXISTS { ?x rdf:type &lt;A1&gt; } } +</code></pre><p>Another category of schema-empowered optimizations has to do with improved selectivity estimation. In this respect, knowledge about the cardinality (minimum cardinality, maximum cardinality, exact cardinality, functionality) of a property can be exploited to formulate better query plans, even if data statistics are incomplete, missing or erroneous.</p> +<p>Similarly, taking into account class hierarchies, or the definition of classes/properties via set theoretic constructs (union, intersection) at the schema level, can provide valuable information on the selectivity of certain triple patterns, thus facilitating the process of query optimization. Similar effects can be achieved using information about properties (functionality, transitivity, symmetry, etc.).</p> +<p>As an example of these patterns, consider the query below, where class <code>&lt;C&gt;</code> is defined as the intersection of classes <code>&lt;C1&gt;</code> and <code>&lt;C2&gt;</code>. 
Thus, the triple pattern <code>(?x rdf:type &lt;C&gt;)</code> is more selective than <code>(?y rdf:type &lt;C1&gt;)</code> and <code>(?z rdf:type &lt;C2&gt;)</code>, and this should be immediately recognizable by the optimizer, without having to resort to cost estimations. This example also shows how unnecessary triple patterns can be pruned from a query to reduce the number of necessary joins. Figure 1 illustrates the query plan obtained when the OWL intersectionOf construct is used.</p> +<pre tabindex="0"><code>SELECT ?x +WHERE { ?x rdf:type &lt;C&gt; . ?x &lt;P1&gt; ?y . + ?y rdf:type &lt;C1&gt; . ?y &lt;P2&gt; ?z . ?z rdf:type &lt;C2&gt; } +</code></pre><p><img src="owl_constraints.png" alt="image"></p> +<p>Schema information can also be used by the query optimizer to rewrite SPARQL queries into equivalent ones that are in a form for which already known optimization techniques are easily applicable. For example, the query below could easily be transformed into a classical star-join query if we know (from the schema) that property <code>P4</code> is a symmetric property.</p> +<pre tabindex="0"><code>SELECT ?y ?y1 ?y2 ?y3 +WHERE { ?x &lt;P1&gt; ?y . ?x &lt;P2&gt; ?y1 . + ?x &lt;P3&gt; ?y2 . ?y3 &lt;P4&gt; ?x } +</code></pre><h3 id="conclusion">Conclusion</h3> +<p>In this post we argued that OWL-empowered optimization techniques can be beneficial for SPARQL query optimization when used in tandem with standard heuristics based on statistics. We provided some examples which showed the power of such optimizations in various cases, namely:</p> +<ul> +<li>Cases where the search space can be pruned due to the schema and the associated constraints; an extreme special sub-case is the identification of queries that violate schema constraints and thus produce no results.</li> +<li>Cases where the schema can help in the estimation of triple pattern selectivity, even if statistics are incomplete or missing.</li> +<li>Cases where the schema can identify redundant triple patterns that do not affect the result and can be safely eliminated from the query.</li> +<li>Cases where the schema can be used for rewriting a query in an equivalent form that would facilitate optimization using well-known optimization techniques.</li> +</ul> +<p>This list is by no means complete, as further cases can be identified by optimizers. Our aim in this post was not to provide a complete listing, but to demonstrate the potential of the idea in various directions.</p> + + + + + Person Activity Subgraph Features in LDBC DATAGEN + https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/ + Wed, 04 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/ + <p>When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically drawn to the friendship subgraph and its structure. However, a social graph is more than a bunch of people connected by friendship relations; it contains many other elements worth looking at. With a quick look at commercial social networks like Facebook, Twitter or Google+, one can easily identify a lot of other elements such as text, images or even video assets. More importantly, all these elements form other subgraphs within the social network! 
For example, the person activity subgraph is composed of posts and their replies in the different forums/groups of a social network, and has a tree-like structure connecting people through their message interactions.</p> +<p>When looking at the LDBC Social Network Benchmark (SNB) and its interactive workload, one realizes that these other subgraphs, and especially the person activity subgraph, play a role even more important than that played by the friendship subgraph. Just two numbers illustrate this importance: 11 out of the 14 interactive workload queries need to traverse parts of the person activity subgraph, and about 80% of all the data generated by DATAGEN belongs to this subgraph. As a consequence, a lot of effort has been devoted to making sure that the person activity subgraph is realistic enough to fulfill the needs of the benchmark. In the rest of this post, I will discuss some of the features implemented in DATAGEN that make the person activity subgraph interesting.</p> +<h3 id="reaslistic-message-content">Realistic Message Content</h3> +<p>Message content in DATAGEN is not random, but contains snippets of text extracted from DBpedia related to the tags the message has. Furthermore, not all messages have the same size; it depends on whether they are posts or replies. For example, the size of a post is selected uniformly between a minimum and a maximum, but there is also a small probability that the content is very large (about 2000 characters). In the case of comments (replies to posts), there is a probability of 0.66 that they are very short (“ok”, “good”, “cool”, “thanks”, etc.). Moreover, in real forum conversations, it is typical to see conversations evolving from one topic to another. For this reason, there is a probability that the tags of comments replying to a post change during the flow of the conversation, moving from the post&rsquo;s tags to other related or randomly selected tags.</p> +<h3 id="non-uniform-activity-levels">Non-uniform activity levels</h3> +<p>In a real social network, not all the members show the same level of activity. Some people post messages only sporadically, while others are significantly more active. DATAGEN reproduces this phenomenon by correlating the activity level with the number of friends a person has. That is, the more friends a person has, the larger the number of posts they create, and the larger the number of groups they belong to.</p> +<h3 id="time-correlated-post-and-comment-generation">Time correlated post and comment generation</h3> +<p>In a real social network, user activity is driven by real world events such as sport events, elections or natural disasters, just to cite a few. For this reason, we observe spikes of activity around these events, where the amount of messages created increases significantly during a short period of time, reaching a maximum and then decreasing. DATAGEN emulates this behavior by generating a set of real world events about specific tags. Then, when the dates of posts and comments are generated, these events are taken into account in such a way that posts and comments are clustered around them. Also, not all events are equally relevant, so some spikes are larger than others. The shape of the activity is modeled following the model described in <a href="#references">[1]</a>. Furthermore, in order to represent the more normal and uniform person activity levels, we also generate uniformly distributed messages along the time line (a rough sketch of how these two mechanisms combine is shown below).</p>
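+<p>The following is a rough sketch of how the two mechanisms above could be combined. The names and constants are hypothetical and only illustrative; they are not taken from the actual DATAGEN code: the number of messages grows with the number of friends, and each message date is either drawn uniformly or clustered around a correlated event.</p>
+<pre tabindex="0"><code>// Rough sketch (hypothetical names and constants): activity volume grows with
+// the number of friends; dates mix uniform background activity with event spikes.
+class ActivitySketch {
+    static long[] messageDates(int numFriends, long membershipDate, long simulationEnd,
+                               long[] eventDates, java.util.Random random) {
+        int numMessages = 5 + 2 * numFriends;   // more friends implies more activity
+        long[] dates = new long[numMessages];
+        long window = 4L * 60 * 60 * 1000;      // cluster within a few hours of the event
+        for (int i = 0; i &lt; numMessages; i++) {
+            if (eventDates.length == 0 || random.nextDouble() &lt; 0.3) {
+                // uniform background activity between membership and end of simulation
+                dates[i] = membershipDate
+                        + (long) (random.nextDouble() * (simulationEnd - membershipDate));
+            } else {
+                // event-driven activity: a crude stand-in for the density of [1]
+                long event = eventDates[random.nextInt(eventDates.length)];
+                dates[i] = event + (long) ((random.nextDouble() - 0.5) * 2 * window);
+            }
+        }
+        return dates;
+    }
+}
+</code></pre>
+<p>In the actual generator the event-driven dates follow the density described in [1] rather than this simple window, but the idea of mixing uniform background activity with event-driven spikes is the same.</p>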
+<p>The following figure shows the user activity volume along the time line.</p> +<p><img src="1.png" alt="image"></p> +<p>As we see, the timeline contains spikes of activity, instead of being uniform. Note that the generally increasing activity volume is due to the fact that more people are added to the social network as time advances.</p> +<p>In this post we have reviewed several interesting characteristics of the person activity generation process in DATAGEN. Stay tuned for future blog posts about this topic.</p> +<h4 id="references">References</h4> +<p>[1] Leskovec, J., Backstrom, L., &amp; Kleinberg, J. (2009, June). Meme-tracking and the dynamics of the news cycle. In <em>Proceedings of the 15th ACM SIGKDD international conference on Knowledge discovery and data mining</em> (pp. 497-506). ACM.</p> + + + + + SNB Driver - Part 2: Tracking Dependencies Between Queries + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + Fri, 23 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + <p>The <a href="https://ldbcouncil.org/post/snb-driver-part-1">SNB Driver part 1</a> post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we&rsquo;ll drill down deeper into the details of what it means to execute &ldquo;dependent queries&rdquo; during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in detail; they are just there to serve as a point of reference.</p> +<h3 id="definitions">Definitions</h3> +<ul> +<li> +<p><em>Simulation Time (ST)</em>: notion of time created by the data generator. All time stamps in the generated data set are in simulation time</p> +</li> +<li> +<p><em>Real Time (RT)</em>: wall clock time</p> +</li> +<li> +<p><em>Time Compression Ratio</em>: function that maps simulation time to real time, e.g., an offset in combination with a compression ratio. It is a static value, set in driver configuration. The Time Compression Ratio is reported along with benchmark results, allowing others to recreate the same benchmark</p> +</li> +<li> +<p><em>Operation</em>: read and/or write</p> +</li> +<li> +<p><em>Dependencies</em>: operations in this set introduce dependencies in the workload. That is, for every operation in this set there exists at least one other operation (in Dependents) that cannot be executed until this operation has been processed</p> +</li> +<li> +<p><em>Dependents</em>: operations in this set are dependent on at least one other operation (in Dependencies) in the workload</p> +</li> +<li> +<p><em>Due Time (DueT)</em>: point in simulation time at which the execution of an operation should be initiated.</p> +</li> +<li> +<p><em>Dependent Time (DepT)</em>: in addition to Due Time, every operation in Dependents also has a Dependent Time, which corresponds to the Due Time of the operation that it depends on. Dependent Time is always before Due Time. 
For operations with multiple dependencies, Dependent Time is the maximum Due Time of all the operations it depends on.</p>
+</li>
+<li>
+<p><em>Safe Time (SafeT)</em>: time duration.</p>
+<ul>
+<li>
+<p>when two operations have a necessary order in time (i.e., a dependency) there is at least a SafeT interval between them</p>
+</li>
+<li>
+<p>SafeT is the minimum duration between the Dependent Time and Due Time of any operation in Dependents</p>
+</li>
+</ul>
+</li>
+<li>
+<p><em>Operation Stream</em>: sequence of operations ordered by Due Time (dependent operations must be separated by at least SafeT)</p>
+</li>
+<li>
+<p><em>Initiated Operations</em>: operations that have started executing but not yet finished</p>
+</li>
+<li>
+<p><em>Local Completion Time (per driver)</em>: point in simulation time behind which there are no uncompleted operations. Local Completion Time = min(min(Initiated Operations), max(Completed Operations))</p>
+</li>
+<li>
+<p><em>Global Completion Time (GCT)</em>: minimum completion time of all drivers. Once GCT has advanced to the Dependent Time of some operation, that operation is safe to execute, i.e., the operations it depends on have all completed executing. Global Completion Time = min(Local Completion Time)</p>
+</li>
+<li>
+<p><em>Execution Window (Window)</em>: a timespan within which all operations can be safely executed</p>
+<ul>
+<li>
+<p>All operations satisfying window.startTime &lt;= operation.DueT &lt; window.endTime may be executed</p>
+</li>
+<li>
+<p>Within a window no restrictions on operation ordering or operation execution time are enforced; the driver is free to choose an arbitrary scheduling strategy inside the window</p>
+</li>
+<li>
+<p>To ensure that execution order respects dependencies between operations, window size is bounded by SafeT, such that: 0 &lt; window.duration &lt;= SafeT</p>
+</li>
+<li>
+<p>Window duration is fixed, per operation stream; this is to simplify scheduling and make benchmark runs repeatable</p>
+</li>
+<li>
+<p>Before any operations within a window can start executing it is required that: GCT &gt;= window.startTime - (SafeT - window.duration)</p>
+</li>
+<li>
+<p>All operations within a window must initiate and complete between window start and end times: window.startTime &lt;= operation.initiate &lt; window.endTime and window.startTime &lt;= operation.complete &lt; window.endTime</p>
+</li>
+</ul>
+</li>
+<li>
+<p><em>Dependency Mode</em>: defines dependencies, constraints on operation execution order</p>
+</li>
+<li>
+<p><em>Execution Mode</em>: defines how the runtime should execute operations of a given type</p>
+</li>
+</ul>
+<h3 id="tracking-dependencies">Tracking Dependencies</h3>
+<p>Now, the fun part: making sure dependent operations are executed in the correct order.</p>
+<p>Consider that every operation in a workload belongs to none, one, or both of the following sets: Dependencies and Dependents. As mentioned, the driver uses operation time stamps (Due Times) to ensure that dependencies are maintained. It keeps track of the latest point in time behind which every operation has completed. That is, every operation (i.e., dependency) with a Due Time lower than or equal to this time is guaranteed to have completed execution.
It does this by maintaining a monotonically increasing variable called Global Completion Time (GCT).</p>
+<p>Logically, every time the driver (via a database connector) begins execution of an operation from Dependencies, that operation is added to Initiated Operations:</p>
+<ul>
+<li>the set of operations that have started executing but not yet finished.</li>
+</ul>
+<p>Then, upon completion, the operation is removed from Initiated Operations and added to Completed Operations:</p>
+<ul>
+<li>the set of operations that have started and finished executing.</li>
+</ul>
+<p>Using these sets, each driver process maintains its own view of GCT in the following way. Local progress is monitored and managed using a variable called Local Completion Time (LCT):</p>
+<ul>
+<li>the point in time behind which there are no uncompleted operations. No operation in Initiated Operations has a lower or equal Due Time and no operation in Completed Operations has an equal or higher Due Time.</li>
+</ul>
+<p>LCT is periodically sent to all other driver processes, which all then (locally) set their view of GCT to the minimum LCT of all driver processes. At this point the driver has two of the three necessary pieces of information (the third is covered shortly) required to know when to execute an operation:</p>
+<ul>
+<li>
+<p><em>Due Time</em>: point in time at which an operation should be executed, assuming all preconditions (e.g., dependencies) have been fulfilled</p>
+</li>
+<li>
+<p><em>GCT</em>: every operation (from Dependencies) with a Due Time before this point in time has completed execution</p>
+</li>
+</ul>
+<p>However, with only GCT to track dependencies the driver has no way of knowing when it is safe to execute any particular dependent operation. What GCT communicates is that all dependencies up to some point in time have completed, but whether or not the dependencies for any particular operation are within these completed operations is unknown. The driver would have to wait until GCT has passed the Due Time (because Dependent Time is always lower) of an operation before that operation could be safely executed, which would result in the undesirable outcome of every operation missing its Due Time. The missing piece of information is which particular operation in Dependencies a given operation in Dependents depends on; more specifically, the Due Time of that operation. This is referred to as Dependent Time:</p>
+<ul>
+<li>in addition to Due Time, every operation in Dependents also has (read: must have) a Dependent Time, which corresponds to the latest Due Time of all the operations it depends on. Once GCT has advanced beyond the Dependent Time of an operation, that operation is safe to execute.</li>
+</ul>
+<p>Using these three mechanisms (Due Time, GCT, and Dependent Time) the driver is able to execute operations while ensuring their dependencies are satisfied beforehand.</p>
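+<p>As an illustration of the bookkeeping described above, the following sketch maintains Local Completion Time from the Initiated and Completed operation sets and derives Global Completion Time as the minimum LCT across driver processes. It is not the driver&rsquo;s actual code; the data structures and function names are assumptions, and a real implementation would compute these values incrementally and in a thread-safe way.</p>
+<pre tabindex="0"><code>initiated = set()    # Due Times of operations that have started but not yet finished
+completed = set()    # Due Times of operations that have finished
+
+def on_operation_started(due_time):
+    initiated.add(due_time)
+
+def on_operation_finished(due_time):
+    initiated.remove(due_time)
+    completed.add(due_time)
+
+def local_completion_time():
+    # LCT = min(min(Initiated Operations), max(Completed Operations)), as defined above.
+    candidates = []
+    if initiated:
+        candidates.append(min(initiated))
+    if completed:
+        candidates.append(max(completed))
+    return min(candidates) if candidates else None
+
+def global_completion_time(local_completion_times):
+    # GCT is the minimum LCT reported by all driver processes.
+    known = [lct for lct in local_completion_times if lct is not None]
+    return min(known) if known else None
+
+def is_safe_to_execute(dependent_time, gct):
+    # A dependent operation is safe once GCT has advanced to its Dependent Time.
+    return gct is not None and gct &gt;= dependent_time
+</code></pre>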
+<h3 id="scalable-execution-in-the-presence-of-dependencies">Scalable execution in the Presence of Dependencies</h3>
+<p>The mechanisms introduced in part 1 guarantee that dependency constraints are not violated, but in doing so they unavoidably introduce communication/synchronization overhead between driver threads/processes. To minimize the negative effects that synchronization has on scalability, an additional Execution Mode was introduced (more about Execution Modes will be discussed shortly): Windowed Execution. Windowed Execution has two design goals:</p>
+<p>a) make the generated load less &lsquo;bursty&rsquo;</p>
+<p>b) allow the driver to &lsquo;scale&rsquo;, so that when the driver is given more resources (CPUs, servers, etc.) it is able to generate more load.</p>
+<p>In the context of Windowed Execution, operations are executed in groups (Windows), where operations are grouped according to their Due Time. Every Window has a Start Time, a Duration, and an End Time, and Windows contain only those operations that have a Due Time between Window.startTime and Window.endTime. Logically, all operations within a Window are executed together, at some time within the Window. No guarantee is made regarding exactly when, or in what order, an operation will execute within its Window.</p>
+<p>The reasons this approach is correct are as follows:</p>
+<ul>
+<li>
+<p>Operations belonging to the Dependencies set are never executed in this manner - the Due Times of Dependencies operations are never modified, as this would affect how dependencies are tracked</p>
+</li>
+<li>
+<p>The minimum duration between the Dependent Time and Due Time of any operation in Dependents is known (it can be calculated by scanning through the workload once); this duration is referred to as Safe Time (SafeT)</p>
+</li>
+<li>
+<p>A window does not start executing until the dependencies of all its operations have been fulfilled. This is ensured by enforcing that window execution does not start until</p>
+<p>GCT &gt;= window.startTime - (SafeT - window.duration) = window.endTime - SafeT; that is, the duration between GCT and the end of the window is no longer than SafeT</p>
+</li>
+</ul>
+<p>The advantages of such an execution mode are as follows:</p>
+<ul>
+<li>
+<p>As no guarantees are made regarding the time or order of operation execution within a Window, GCT no longer needs to be read before the execution of every operation, only before the execution of every window</p>
+</li>
+<li>
+<p>Then, as GCT is read less frequently, it follows that it does not need to be communicated between driver processes as frequently. There is no need for, or benefit in, communicating the GCT protocol message more frequently than approximately once per Window.duration; the side effect is reduced network traffic</p>
+</li>
+<li>
+<p>Further, by making no guarantees regarding the order of execution, the driver is free to reschedule operations (within Window bounds). The advantage is that operations can be rearranged in such a way as to reduce unwanted bursts of load during execution, which could otherwise occur while synchronizing GCT during demanding workloads. For example, a uniform scheduler may modify operation Due Times to be uniformly distributed across the Window timespan, to &lsquo;smoothen&rsquo; the load within a Window.</p>
+</li>
+</ul>
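+<p>The window start condition and the freedom to re-schedule within a window can be captured in a few lines. The sketch below is illustrative only; the names and the uniform scheduler are assumptions, not the driver&rsquo;s real API:</p>
+<pre tabindex="0"><code>import random
+
+def window_may_start(gct, window_start, window_duration, safe_t):
+    # A window may begin once GCT &gt;= window.endTime - SafeT, which is the same as
+    # GCT &gt;= window.startTime - (SafeT - window.duration).
+    return gct &gt;= (window_start + window_duration) - safe_t
+
+def uniform_reschedule(operations, window_start, window_duration):
+    # Operations may be re-ordered freely inside their window; a uniform scheduler
+    # spreads their Due Times over the window timespan to smooth the generated load.
+    new_due_times = sorted(window_start + random.random() * window_duration
+                           for _ in operations)
+    return list(zip(new_due_times, operations))
+</code></pre>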
+<p>As with any system, there are trade-offs to this design, particularly regarding Window.duration. The main trade-off is that between &lsquo;workload resolution&rsquo; and scalability. Increasing Window.duration reduces synchronization but also reduces the resolution at which the workload definition is followed. That is, the generated workload becomes less like the workload definition. However, as this is both bounded and configurable, it is not a major concern. This issue is illustrated in Figure 1, where the same stream of events is split into two different workloads based on different Window sizes. The workload with Window size 5 (on the right) has better resolution, especially for the &lsquo;bursty&rsquo; part of the event stream.</p>
+<p><img src="window-scheduling.png" alt="image"><br>
+Figure 1. Window scheduling</p>
+<p>This design also trades a small amount of repeatability for scalability: as there are no timing or ordering guarantees within a window, two executions of the same window are not guaranteed to be equivalent - &lsquo;what happens in the window stays in the window&rsquo;. Despite sacrificing this repeatability, the results of operations do not change. No dependency-altering operations occur during the execution of a Window; therefore the results for all queries should be equivalent between two executions of the same workload, and there is no effect on the expected result for any given operation.</p>
+
+
+
+
+ SNB Driver - Part 3: Workload Execution Putting It All Together
+ https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/
+ Tue, 20 Jan 2015 00:00:00 +0000
+
+ https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/
+ <p>Up until now we have introduced the <a href="https://ldbcouncil.org/post/snb-driver-part-1">challenges faced when executing the LDBC SNB benchmark</a>, as well as explained <a href="https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries">how some of these are overcome</a>. With the foundations laid, we can now explain precisely how operations are executed.</p>
+<p>Based on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these classifications the driver runtime then knows how each operation should be executed. These modes, as well as what they mean to the driver runtime, are described below.</p>
+<h3 id="dependency-modes">Dependency Modes</h3>
+<p>While executing a workload the driver treats operations differently, depending on their Dependency Mode. In the previous section operations were categorized by whether or not they are in the sets Dependencies and/or Dependents.</p>
+<p>Another way of communicating the same categorization is by assigning a Dependency Mode to operations - every operation type generated by a workload definition must be assigned to exactly one Dependency Mode. Dependency Modes define dependencies, i.e., constraints on operation execution order. The driver supports a number of different Dependency Modes: None, Read Only, Write Only, Read Write.
During workload execution, operations of each type are treated as follows:</p>
+<p><strong>• None</strong></p>
+<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations to have completed executing)</p>
+<p>– Prior Execution: do nothing</p>
+<p>– After Execution: do nothing</p>
+<p><strong>• Read Only</strong></p>
+<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations to have completed executing)</p>
+<p>Dependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p>
+<p>– Prior Execution: wait for GCT &gt;= operation.DepT</p>
+<p>– After Execution: do nothing</p>
+<p><strong>• Write Only</strong></p>
+<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p>
+<p>Dependent On (NO): operation execution does not depend on GCT to have advanced sufficiently (i.e., correct execution of these operations does not depend on any other operations to have completed execution)</p>
+<p>– Prior Execution: add operation to Initiated Operations</p>
+<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p>
+<p><strong>• Read Write</strong></p>
+<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p>
+<p>Dependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p>
+<p>– Prior Execution: add operation to Initiated Operations, wait for GCT &gt;= operation.DepT</p>
+<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p>
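+<p>The per-mode bookkeeping above boils down to two hooks around each operation, sketched below. The names and structures are assumptions for illustration, not the driver&rsquo;s actual code:</p>
+<pre tabindex="0"><code>import time
+
+DEPENDED_ON  = {"WRITE_ONLY", "READ_WRITE"}   # advance GCT via Initiated/Completed sets
+DEPENDENT_ON = {"READ_ONLY", "READ_WRITE"}    # must wait for GCT &gt;= operation.DepT
+
+def before_execute(op, gct, initiated):
+    if op.mode in DEPENDENT_ON:
+        while gct() &lt; op.dep_time:      # wait until all dependencies have completed
+            time.sleep(0.001)
+    if op.mode in DEPENDED_ON:
+        initiated.add(op)
+
+def after_execute(op, initiated, completed):
+    if op.mode in DEPENDED_ON:
+        initiated.remove(op)
+        completed.add(op)
+</code></pre>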
+<h3 id="execution-modes">Execution Modes</h3>
+<p>Execution Modes relate to how operations are scheduled, when they are executed, and what their failure conditions are. Each operation type in a workload definition must be assigned to exactly one Execution Mode. The driver supports a number of different Execution Modes: Asynchronous, Synchronous, Partially Synchronous. It splits a single workload operation stream into multiple streams, zero or more streams per Execution Mode. During workload execution, operations from each of these streams are treated as follows.</p>
+<p><strong>• Asynchronous</strong>: operations are executed individually, when their Due Time arrives.</p>
+<p>Motivation: This is the default execution mode; it executes operations as true to the workload definition as possible.</p>
+<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler</p>
+<p>– Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p>
+<p>– Max Concurrent Executions: unbounded</p>
+<p>– Max Execution Time: unbounded</p>
+<p>– Failure: operation execution starts later than: operation.DueT + Tolerated Delay</p>
+<p><strong>• Synchronous</strong>: operations are executed individually, sequentially, in a blocking manner.</p>
+<p>Motivation: Some dependencies are difficult to capture efficiently with SafeT and GCT alone. For example, social applications often support conversations via posts and likes, where likes depend on the existence of posts. Furthermore, posts and likes also depend on the existence of the users that make them. However, users are created at a lower frequency than posts and likes, and it can be assumed they do not immediately start creating content. As such, a reasonably long SafeT can be used between the creation of a user and the first time that user creates posts or likes. Conversely, posts are often replied to and/or liked soon after their creation, meaning a short SafeT would be necessary to maintain the ordering dependency. Consequently, maintaining the dependencies related to conversations would require a short SafeT, and hence a small window. This results in windows containing fewer operations, leading to less potential for parallelism within windows, less freedom in scheduling, more synchronization, and a greater likelihood of bursty behavior - all negative things.</p>
+<p>The alternative offered by Synchronous Execution is that, when practical, operations of certain types can be partitioned (e.g. posts and likes could be partitioned by the forum in which they appear), and partitions assigned to driver processes. Using the social application example from above, if all posts and likes were partitioned by forum, the driver process that executes the operations from any partition could simply execute them sequentially.
Then the only dependency to maintain would be on user operations, reducing synchronization dramatically, and parallelism could still be achieved as each partition would be executed independently, in parallel, by a different driver process.</p>
+<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler</p>
+<p>– Execute When time &gt;= operation.DueT and previousOperation.completed == true (and GCT &gt;= operation.DepT)</p>
+<p>– Max Concurrent Executions: 1</p>
+<p>– Max Execution Time: nextOperation.DueT - operation.DueT</p>
+<p>– Failure: operation execution starts later than: operation.DueT + Tolerated Delay. E.g., if the previousOperation did not complete in time, forcing the current operation to wait for longer than the tolerated delay</p>
+<p><strong>• Partially Synchronous</strong> (Windowed Execution, described in more detail in the previous post): groups of operations from the same time window are executed together</p>
+<p>– Re-scheduling Before Execution: Yes, as long as the following still holds:</p>
+<p>window.startTime &lt;= operation.DueT &lt; window.startTime + window.duration</p>
+<p>Operations within a window may be scheduled in any way, as long as they remain in the window from which they originated: their Due Times, and therefore ordering, may be modified</p>
+<p>– Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p>
+<p>– Max Concurrent Executions: number of operations within window</p>
+<p>– Max Execution Time: (window.startTime + window.duration) - operation.DueT</p>
+<p>– Failure: operation execution starts later than: window.startTime + window.duration; or operation execution does not finish by: window.startTime + window.duration</p>
+<h3 id="tying-it-back-to-ldbc-snb">Tying it back to LDBC SNB</h3>
+<p>The driver was designed to execute the workload of LDBC SNB. As discussed, the main challenge of running queries in parallel on graph-shaped data stems from dependencies introduced by the graph structure. In other words, workload partitioning becomes as hard as graph partitioning.</p>
+<p>The LDBC SNB data can in fact be seen as a union of two parts:</p>
+<ol>
+<li>
+<p>Core Data: a relatively small and dense friendship graph (not more than 10% of the data). Updates on this part are very hard to partition among driver threads, since the graph is essentially a single dense strongly connected component.</p>
+</li>
+<li>
+<p>User Activity Data: posts, replies, likes; this is by far the biggest part of the data. Updates on this part are easily partitioned as long as the dependencies with the &ldquo;core&rdquo; part are satisfied (i.e., users don&rsquo;t post things before their profiles are created, etc.).</p>
+</li>
+</ol>
+<p>In order to avoid friendship graph partitioning, the driver introduces the concept of SafeT, the minimal simulation time that should pass between two dependent events.</p>
+<p>This property is enforced by the data generator, i.e. the driver does not need to change or delay operations in order to guarantee dependency safety. Respecting dependencies now means globally communicating the advances of the Global Completion Time, and making sure that operations do not start earlier than SafeT after the operations they depend on.</p>
+<p>On the other hand, the driver exploits the fact that some of the dependencies in fact do not hinder partitioning: although replies to a post can only be sent after the post is created, these kinds of dependencies are satisfied if we partition the workload by forums.</p>
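+<p>A minimal sketch of this partition-by-forum idea (illustrative only; the names and structures are assumptions, not the driver&rsquo;s real code) could look as follows:</p>
+<pre tabindex="0"><code>import time
+from collections import defaultdict
+
+def partition_by_forum(update_operations, num_threads):
+    # All updates that belong to the same forum end up in the same partition.
+    partitions = defaultdict(list)
+    for op in update_operations:                    # posts, comments, likes
+        partitions[hash(op.forum_id) % num_threads].append(op)
+    return partitions
+
+def run_partition(ops, gct, execute):
+    # Within one partition, operations run sequentially (Synchronous Execution Mode):
+    # ordering inside a forum needs no global coordination; only dependencies on the
+    # core data (e.g. the creation of the posting user) are checked against GCT.
+    for op in sorted(ops, key=lambda o: o.due_time):
+        while gct() &lt; op.dep_time:                  # wait for core-data dependencies
+            time.sleep(0.001)
+        execute(op)
+</code></pre>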
<p>This way, all (update) operations on posts and comments from one forum are assigned to one driver thread. Since there are typically a lot of forums, each driver thread gets multiple ones. Updates from one forum are then run in Synchronous Execution Mode, and parallelism is achieved by running many distinct forums in parallel. By doing so, we can add posts and replies to forums at very high frequency without the need to communicate the GCT across driver instances (i.e. we efficiently create the so-called flash-mob effects in the posting/replying workload).</p>
+
+
+
+
+ Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide
+ https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/
+ Tue, 13 Jan 2015 00:00:00 +0000
+
+ https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/
+ <p>Until now we have discussed several aspects of the <a href="https://ldbcouncil.org/benchmarks/spb">Semantic Publishing Benchmark (SPB)</a> such as the <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">difference in performance between virtual and real servers configuration</a>, how to choose an <a href="https://ldbcouncil.org/post/making-semantic-publishing-execution-rules">appropriate query mix</a> for a benchmark run and our experience with using SPB in the development process of GraphDB for <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">finding performance issues</a>.</p>
+<p>In this post we provide a step-by-step guide on how to run SPB using the <a href="http://rdf4j.org/">Sesame</a> RDF data store on a fresh install of <a href="http://releases.ubuntu.com/14.04.1/">Ubuntu Server 14.04.1</a>. The scenario is easy to adapt to other RDF triple stores which support the Sesame Framework used for querying and analyzing RDF data.</p>
+<h3 id="prerequisites">Prerequisites</h3>
+<p>We start with a fresh server installation, but before proceeding with the setup of the Sesame Data Store and the SPB benchmark we need the following pieces of software up and running:</p>
+<ul>
+<li>Git</li>
+<li>Apache Ant 1.8 or higher</li>
+<li>OpenJDK 6 or Oracle JDK 6 or higher</li>
+<li>Apache Tomcat 7 or higher</li>
+</ul>
+<p>If you already have these components installed on your machine you can directly proceed to the next section: <em>Installing Sesame</em></p>
+<p>Following are sample commands which can be used to install the required software components:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo apt-get install git
+</span></span><span style="display:flex;"><span>sudo apt-get install ant
+</span></span><span style="display:flex;"><span>sudo apt-get install default-jdk
+</span></span><span style="display:flex;"><span>sudo apt-get install tomcat7
+</span></span></code></pre></div><p>Optionally, Apache Tomcat can be downloaded as a zipped file and extracted to a location of your choice.</p>
+<p>After a successful installation of Apache Tomcat you should be able to get the default splash page <em>“It works”</em> when you open your web browser and enter the following address: http://&lt;your_ip_address&gt;:8080</p>
+<h3 id="installing-sesame">Installing Sesame</h3>
+<p>We will use the current Sesame version, 2.7.14.
You can download it <a href="http://sourceforge.net/projects/sesame/files/Sesame%202/">here</a> or run following command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>wget <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;http://sourceforge.net/projects/sesame/files/Sesame%202/2.7.14/openrdf-sesame-2.7.14-sdk.tar.gz/download&#34;</span> <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> -O openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>Then extract the Sesame tarball:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>tar -xvzf openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>To deploy sesame you have to copy the two war files that are in <em>openrdf-sesame-2.7.14/war</em> to <em>/var/lib/tomcat7/webapps</em></p> +<p>From <em>openrdf-sesame-2.7.14/war</em> you can do it with command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>cp openrdf-*.war &lt;tomcat_install&gt;/webapps +</span></span></code></pre></div><p>Sesame applications write and store configuration files in a single directory and the tomcat server needs permissions for it.</p> +<p>By default the configuration directory is: <em>/usr/share/tomcat7/.aduna</em></p> +<p>Create the directory:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo mkdir /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Then change the ownership:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chown tomcat7 /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>And finally you should give the necessary permissions:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chmod o+rwx /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Now when you go to: http://&lt;your_ip_address&gt;:8080/openrdf-workbench/repositories</p> +<p>You should get a screen like this:</p> +<p><img src="01-Sesame-repo-list.png" alt="image"></p> +<h3 id="setup-spb">Setup SPB</h3> +<p>You can download the SPB code and find brief documentation on GitHub:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm">https://github.com/ldbc/ldbc_spb_bm</a></p> +<p>A detailed documentation is located here:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf">https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf</a></p> +<p>SPB offers many configuration options which control various features of the benchmark e.g.:</p> +<ul> +<li>query mixes</li> +<li>dataset size</li> +<li>loading 
datasets</li>
+<li>number of agents</li>
+<li>validating results</li>
+<li>test conformance to OWL2-RL ruleset</li>
+<li>update rate of agents</li>
+</ul>
+<p>Here we demonstrate how to generate a dataset and execute a simple test run with it.</p>
+<p>First download the SPB source code from the repository:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>git clone https://github.com/ldbc/ldbc_spb_bm.git
+</span></span></code></pre></div><p>Then in the ldbc_spb_bm directory build the project:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>ant build-basic-querymix
+</span></span></code></pre></div><p>If you simply execute the command:</p>
+<pre tabindex="0"><code>ant
+</code></pre><p>you’ll get a list of all available build configurations for the SPB test driver, but for the purpose of this step-by-step guide, the configuration shown above is sufficient.</p>
+<p>Depending on the generated dataset size, a bigger Java heap size may be required for the Sesame Store. You can change it by adding the following arguments to Tomcat&rsquo;s startup files, e.g. in <em>catalina.sh</em>:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>export JAVA_OPTS<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;-d64 -Xmx4G&#34;</span>
+</span></span></code></pre></div><p>To run the Benchmark you need to create a repository in the Sesame Data Store, similar to the following screenshot:</p>
+<p><img src="02-Sesame-create-repo.png" alt="image"></p>
+<p>Then we need to point the benchmark test driver to the SPARQL endpoint of that repository.
This is done in the <em>ldbc_spb_bm/dist/test.properties</em> file.</p>
+<p>The default value of <em>datasetSize</em> in the properties is set to be 10M, but for the purpose of this guide we will decrease it to 1M.</p>
+<p>You need to change:</p>
+<pre tabindex="0"><code>datasetSize=1000000
+</code></pre><p>Also change the URLs of the SPARQL endpoint of the repository:</p>
+<pre tabindex="0"><code>endpointURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1
+endpointUpdateURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1/statements
+</code></pre><p>The first step, before measuring the performance of a triple store, is to load the reference-knowledge data, generate a 1M dataset, load it into the repository and finally generate query substitution parameters.</p>
+<p>These are the settings to do that; the following parameters will &lsquo;instruct&rsquo; the SPB test driver to perform all the actions described above:</p>
+<pre tabindex="0"><code>#Benchmark Operational Phases
+loadOntologies=true
+loadReferenceDatasets=true
+generateCreativeWorks=true
+loadCreativeWorks=true
+generateQuerySubstitutionParameters=true
+validateQueryResults=false
+warmUp=false
+runBenchmark=false
+runBenchmarkOnlineReplicationAndBackup=false
+checkConformance=false
+</code></pre><p>To run the benchmark execute the following:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>java -jar semantic_publishing_benchmark-basic-standard.jar test.properties
+</span></span></code></pre></div><p>When the initial run has finished, we should have a 1M dataset loaded into the repository and a set of files with query substitution parameters.</p>
+<p>Next we will measure the performance of the Sesame Data Store by changing some configuration properties:</p>
+<pre tabindex="0"><code>#Benchmark Configuration Parameters
+warmupPeriodSeconds=60
+benchmarkRunPeriodSeconds=300
+...
+#Benchmark Operational Phases
+loadOntologies=false
+loadReferenceDatasets=false
+generateCreativeWorks=false
+loadCreativeWorks=false
+generateQuerySubstitutionParameters=false
+validateQueryResults=false
+warmUp=true
+runBenchmark=true
+runBenchmarkOnlineReplicationAndBackup=false
+checkConformance=false
+</code></pre><p>After the benchmark test run has finished, result files are saved in the folder <em>dist/logs</em>.</p>
+<p>There you will find three types of results: the result summary of the benchmark run (<em>semantic_publishing_benchmark_results.log</em>), brief results and detailed results.</p>
+<p>In <em>semantic_publishing_benchmark_results.log</em> you will find the results distributed per second.
They should be similar to the listing below:</p>
+<p>Benchmark Results for the 300th second</p>
+<pre tabindex="0"><code>Seconds : 300 (completed query mixes : 0)
+  Editorial:
+    2 agents
+
+    9 inserts (avg : 22484 ms, min : 115 ms, max : 81389 ms)
+    0 updates (avg : 0 ms, min : 0 ms, max : 0 ms)
+    0 deletes (avg : 0 ms, min : 0 ms, max : 0 ms)
+
+    9 operations (9 CW Inserts (0 errors), 0 CW Updates (1 errors), 0 CW Deletions (2 errors))
+    0.0300 average operations per second
+
+  Aggregation:
+    8 agents
+
+    2 Q1 queries (avg : 319 ms, min : 188 ms, max : 451 ms, 0 errors)
+    3 Q2 queries (avg : 550 ms, min : 256 ms, max : 937 ms, 0 errors)
+    1 Q3 queries (avg : 58380 ms, min : 58380 ms, max : 58380 ms, 0 errors)
+    2 Q4 queries (avg : 65250 ms, min : 40024 ms, max : 90476 ms, 0 errors)
+    1 Q5 queries (avg : 84220 ms, min : 84220 ms, max : 84220 ms, 0 errors)
+    2 Q6 queries (avg : 34620 ms, min : 24499 ms, max : 44741 ms, 0 errors)
+    3 Q7 queries (avg : 5892 ms, min : 4410 ms, max : 8528 ms, 0 errors)
+    2 Q8 queries (avg : 3537 ms, min : 546 ms, max : 6528 ms, 0 errors)
+    4 Q9 queries (avg : 148573 ms, min : 139078 ms, max : 169559 ms, 0 errors)
+</code></pre><p>This step-by-step guide gave an introduction on how to set up and run the SPB on a Sesame Data Store. Further details can be found in the reference documentation listed above.</p>
+<p>If you have any trouble running the benchmark, don&rsquo;t hesitate to comment or use our social media channels.</p>
+<p>In a future post we will go through some of the parameters of SPB and check their performance implications.</p>
+
+
+
+
+ Semantic Publishing Instance Matching Benchmark
+ https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/
+ Tue, 30 Dec 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/
+ <p>The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the-art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.</p>
+<p>The SPIMBench test cases provide a systematic way for testing the performance of instance matching systems in different settings.
SPIMBench supports the types of test cases already adopted by existing instance matching benchmarks:</p>
+<ul>
+<li>value-based test cases based on applying value transformations (e.g., blank character addition and deletion, change of date format, abbreviations, synonyms) on triples relating to a given input entity</li>
+<li>structure-based test cases characterized by a structural transformation (e.g., different nesting levels for properties, property splitting, aggregation)</li>
+</ul>
+<p>The novelty of SPIMBench lies in the support for the following semantics-aware test cases defined on the basis of OWL constructs:</p>
+<ul>
+<li>instance (in)equality (owl:sameAs, owl:differentFrom)</li>
+<li>class and property equivalence (owl:equivalentClass, owl:equivalentProperty)</li>
+<li>class and property disjointness (owl:disjointWith, owl:AllDisjointClasses, owl:propertyDisjointWith, owl:AllDisjointProperties)</li>
+<li>class and property hierarchies (rdfs:subClassOf, rdfs:subPropertyOf)</li>
+<li>property constraints (owl:FunctionalProperty, owl:InverseFunctionalProperty)</li>
+<li>complex class definitions (owl:unionOf, owl:intersectionOf)</li>
+</ul>
+<p>SPIMBench uses and extends the ontologies of LDBC&rsquo;s Semantic Publishing Benchmark (SPB) to tackle the more complex schema constructs expressed in terms of OWL. It also extends SPB&rsquo;s data generator to first generate a synthetic source dataset that does not contain any matches, and then to generate matches and non-matches to entities of the source dataset to address the supported transformations and OWL constructs. The data generation process allows the creation of arbitrarily large datasets, thus supporting the evaluation of both the scalability and the matching quality of an instance matching system.</p>
+<p>Value and structure-based test cases are implemented using the SWING framework <a href="#references">[1]</a> on data and object type properties, respectively. These are produced by applying the appropriate transformation(s) on a source instance to obtain a target instance. Semantics-based test cases are produced in the same way as the value and structure-based test cases, with the difference that appropriate triples are constructed and added to the target dataset to consider the respective OWL constructs.</p>
+<p>SPIMBench, in addition to the semantics-based test cases that differentiate it from existing instance matching benchmarks, also offers a weighted gold standard used to judge the quality of answers of instance matching systems. It contains generated matches (a pair consisting of an entity of the source dataset and an entity of the target dataset), the type of test case it represents, the property on which a transformation was applied (in the case of value-based and structure-based test cases), and a weight that quantifies how easy it is to detect this match automatically. SPIMBench adopts an information-theoretical approach by applying multi-relational learning to compute the weight of the pair of matched instances by measuring the information loss that results from applying transformations to the source data to generate the target data.
This detailed information, which is not provided by state-of-the-art benchmarks, allows users of SPIMBench (e.g., developers of IM systems) to more easily identify the reasons underlying the performance results obtained using SPIMBench and thereby supports the debugging of instance matching systems.</p>
+<p>SPIMBench can be downloaded from <a href="https://github.com/jsaveta/SPIMBench">our repository</a> and a more thorough description thereof can be found on <a href="http://www.ics.forth.gr/isl/spimbench/">http://www.ics.forth.gr/isl/spimbench/</a>.</p>
+<h4 id="references">References</h4>
+<p>[1] A. Ferrara, S. Montanelli, J. Noessner, and H. Stuckenschmidt. Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p>
+
+
+
+
+ Further Developments in SNB BI Workload
+ https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/
+ Thu, 18 Dec 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/
+ <p>We are presently working on the SNB BI workload. Andrey Gubichev of TU Munchen and I are going through the queries and are playing with two SQL-based implementations, one on Virtuoso and the other on Hyper.</p>
+<p>As discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.</p>
+<p>There are obvious marketing applications for an SNB-like dataset. There are also security-related applications, ranging from fraud detection to intelligence analysis. The latter category is significant but harder to approach, as much of the detail of best practice is itself not in the open. In this post, I will outline some ideas discussed over time that might crystallize into a security-related section in the SNB BI workload. We invite comments from practitioners for making the business questions more relevant while protecting sensitive details.</p>
+<p>Let’s look at what scenarios would fit with the dataset. We have people, different kinds of connections between people, organizations, places and messages. Messages (posts/replies), people and organizations are geo-tagged. Making a finer level of geo-tagging, with actual GPS coordinates, travel itineraries etc, all referring to real places, would make the data even more interesting. The geo dimension will be explored separately in a forthcoming post.</p>
+<p>One of the first things to appear when approaching the question is that the analysis of behavior patterns over time is not easily captured in purely declarative queries. For example, the temporal sequence of events and the quantity and quality of interactions between players lead to intractably long queries which are hard to understand and debug. Therefore, views and intermediate materializations become increasingly necessary.</p>
+<p>Another feature of the scene is that information is never complete. Even if logs are complete for any particular system, there are always possible interactions outside of the system. Therefore we tend to get match scores rather than strictly Boolean conditions. Since everybody is related to everybody else via a relatively short path, the nature and strength of the relationship is key to interpreting its significance.</p>
+<p>Since a query consisting of scores and outer joins only is difficult to interpret and optimize, and since the information is seldom complete, some blanks may have to be filled in by guesses.
The database must therefore contain metadata about this.</p>
+<p>An orthogonal aspect to security applications is the access control of the database itself. One might assume that if a data warehouse of analyzable information is put together, the analyst would have access to the entirety of it. This is however not necessarily the case, since the information itself and its provenance may fall under different compartments.</p>
+<p>So, let’s see how some of these aspects could be captured in the SNB context.</p>
+<p>Geography - We materialize a table of travel events, so that an unbroken sequence of posts from the same location (e.g. country) other than the residence of the poster forms a travel event. The posts may have a fine-grained position (IP, GPS coordinates of photos) that marks an itinerary. This is already beyond basic SQL, needing a procedure or window functions.</p>
+<p>The communication between people is implicit in reply threads and forum memberships. A reply is the closest that one comes to a person-to-person message in the dataset. Otherwise all content is posted to forums with more or fewer participants. Membership in a high-traffic forum with few participants would indicate a strong connection. Calculating these time-varying connection strengths is a lot of work and a lot of text in queries. Keeping things simple requires materializing a sparse “adjacency cube,” i.e. a relation of person1, person2, time bucket -&gt; connection strength. In the SNB case the connection strength may be derived from reciprocal replies, likes, being in the same forums, knowing each other etc. Selectivity is important, i.e. being in many small forums together counts for more than being in ones where everybody else also participates.</p>
+<p>The behavior of people in SNB is not identical from person to person, but for the same person it follows a preset pattern. Suppose a question like “which person with access to secrets has a marked change of online behavior?” The change would be starting or stopping communication with a given set of people, for example. Think that the spy meets the future spymaster at a public occasion, has a series of exchanges, travels to an atypical destination, then stops all open contact with the spymaster or related individuals. Patterns like this do not occur in the data but can be introduced easily enough.</p>
+<p>In John Le Carre’s A Perfect Spy, the main character is caught because it comes to light that his travel routes nearly always corresponded to his controller’s. This would make a query. This could be cast in marketing terms as a “(un)common shopping basket.”</p>
+<p>Analytics becomes prediction when one part of a pattern exists without the expected next stage. Thus the same query template can serve for detecting full or partial instances of a pattern, depending on how the scores are interpreted.</p>
+<p>From a database angle, these questions group on an item with internal structure. For the shopping basket this is a set. For the travel routes this is an ordered sequence of space/time points, with a match tolerance on the spatial and temporal elements. Another characteristic is that there is a baseline of expectations and the actual behavior. Both have structure, e.g. the occupation/location/interest/age of one’s social circle. These need to be condensed into a sort of metric space and then changes and rates of change can be observed. Again, this calls for a multidimensional cube to be created as a summary, then algorithms to be applied to this.
The declarative BI query a la TPC-H does not easily capture all of this.</p>
+<p>This leads us to graph analytics in a broader sense. Some of the questions addressed here will still fit in the materialized summaries+declarative queries pattern, but the more complex summarization and clustering moves towards iterative algorithms.</p>
+<p>There is at present a strong interest in developing graph analytics benchmarks in LDBC. This is an activity that extends beyond the FP7 project duration and beyond the initial partners. To this effect I have implemented some SQL extensions for BSP-style processing, as hinted at on my blog. These will be covered in more detail in January, when there are actual experiments.</p>
+
+
+
+
+ Sizing AWS Instances for the Semantic Publishing Benchmark
+ https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/
+ Wed, 17 Dec 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/
+ <p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the famous <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">BBC Dynamic Semantic Publishing</a> scenario. Such a load combines tens of updates per second (e.g. adding metadata about new articles) with an even higher volume of read requests (SPARQL queries collecting recent content and data to generate a web page on a specific subject, e.g. Frank Lampard). As we <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">wrote earlier</a>, SPB was already successfully used to help developers identify performance issues and to introduce optimizations in SPARQL engines such as GraphDB and Virtuoso. Now we are at the point of experimenting with different sizes of the benchmark and different hardware configurations.</p>
+<p>Lately we tested different Amazon Web Services (<a href="https://aws.amazon.com/">AWS</a>) instance types for running the SPB basic interactive query mix in parallel with the standard editorial updates – precisely the type of workload that <a href="https://www.ontotext.com/products/ontotext-graphdb/">GraphDB</a> experiences in the backend of the BBC Sport website. We discovered and report below a number of practical guidelines about the optimal instance types and configurations. We have proven that SPB 50M workloads can be executed efficiently on a mid-sized AWS instance – a c3.2xlarge machine executes 16 read queries and 15 update operations per second. For $1 paid to Amazon for such an instance, GraphDB executes 140 000 queries and 120 000 updates.
The most interesting discovery in this experiment is that if BBC were hosting the triplestore behind their Dynamic Semantic Publishing architecture at AWS, the total cost of the server infrastructure behind their Worldcup 2010 website would have been about $80/day.</p>
+<h3 id="the-experiment">The Experiment</h3>
+<p>For our tests we use:</p>
+<ul>
+<li>GraphDB Standard v6.1</li>
+<li>LDBC-SPB test driver (version 0.1.dc9a626 from 10.Nov.2014) configured as follows:
+<ul>
+<li>8 aggregation agents (read threads) and 2 editorial agents (write threads); for some configurations we experimented with different numbers of agents also</li>
+<li>50M dataset (SF1)</li>
+<li>40 minutes of benchmark run time (60 seconds of warm up)</li>
+</ul>
+</li>
+<li>5 different Amazon EC2 instances and one local server</li>
+</ul>
+<p>Each test run is cold, i.e. data is newly loaded for each run. We set a 5 GByte cache configuration, which is sufficient for the size of the generated dataset. We use the same query substitution parameters (the same randomization seed) for every run, so that we are sure that all test runs are identical.</p>
+<p>We use two types of instances – M3 and C3 instances. They both provide SSD storage for fast I/O performance. The M3 instances have an E5-2670v2, 2.50GHz CPU and provide good all-round performance, while the C3 instances are compute-optimized with a stronger CPU – E5-2680v2, 2.80GHz – but have half as much memory as the M3.</p>
+<p>We also use a local physical server with a dual CPU – E5-2650v2, 2.60GHz – 256GB of RAM and a RAID-0 array of SSDs, in order to provide a baseline for interpreting the performance of the virtualized AWS instances. The CPU capacity of the AWS instances is measured in vCPUs (virtual CPUs). A vCPU is a logical core – one hyper-thread of one physical core of the corresponding Intel Xeon processor used by Amazon. This means that a vCPU represents roughly half a physical core, even though the performance of a hyper-threaded core is not directly comparable with two non-hyper-threaded cores. We should keep this in mind when comparing AWS instances to physical machines, i.e. our local server with two CPUs with 8 physical cores each has 32 logical cores, which is more than the c3.4xlarge instance with 16 vCPUs.</p>
+<h3 id="the-results">The Results</h3>
+<p>For the tests we measured:</p>
+<ul>
+<li><em>queries/s</em> for the read threads, where queries include SELECT and CONSTRUCT</li>
+<li><em>updates/s</em> for the write threads, where an update operation is INSERT or DELETE</li>
+<li><em>queries/$</em> and <em>updates/$</em> – queries or updates per dollar, respectively, calculated for each AWS instance type based on its price and measured throughput</li>
+<li><em>updates/vCPU</em> – modification operations per vCPU per second</li>
+</ul>
+<p>Results (Table 1.) provide strong evidence that performance depends mostly on processor power. This applies to both queries and updates - which in the current AWS setup go on par with one another. Comparing M3 and C3 instances with equal vCPUs we can see that performance is only slightly higher for the M3 machines and even lower for selects with 8 vCPUs.
Taking into account the lower price of C3 because of their lower memory, it is clear that C3 machines are better suited for this type of workload and the sweet spot between price and performance is c3.2xlarge machine.</p> +<p>The improvement in performance between the c3.xlarge and c3.2xlarge is more than twofold where the improvement between c3.2xlarge and c3.4xlarge is considerably lower. We also observe slower growth between c3.4xlarge and the local server machine. This is an indication that for SPB at this scale the difference between 7.5GB and 15GB of RAM is substantial, but RAM above this amount cannot be utilized efficiently by GraphDB.</p> +<p>Table 1. SPB Measurement Results on AWS and Local Servers</p> +<table> +<thead> +<tr> +<th>Server Type</th> +<th>vCPUs</th> +<th>R/W Agents</th> +<th>RAM (GB)</th> +<th>&ldquo;Storage (GB, SSD)&rdquo;</th> +<th>Price USD/h</th> +<th>Queries/ sec.</th> +<th>Updates/ sec.</th> +<th>Queries/ USD</th> +<th>Updates/ USD</th> +<th>Updates/ vCPU</th> +</tr> +</thead> +<tbody> +<tr> +<td>m3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>15</td> +<td>2x 40</td> +<td>0.28</td> +<td>8.39</td> +<td>8.23</td> +<td>107 882</td> +<td>105 873</td> +<td>2.06</td> +</tr> +<tr> +<td>m3.2xlarge</td> +<td>8</td> +<td>8/2</td> +<td>30</td> +<td>2x 80</td> +<td>0.56</td> +<td>15.44</td> +<td>15.67</td> +<td>99 282</td> +<td>100 752</td> +<td>1.96</td> +</tr> +<tr> +<td>c3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>7.5</td> +<td>2x 40</td> +<td>0.21</td> +<td>7.17</td> +<td>6.78</td> +<td>122 890</td> +<td>116 292</td> +<td>1.7</td> +</tr> +<tr> +<td><strong>c3.2xlarge</strong></td> +<td><strong>8</strong></td> +<td><strong>8/2</strong></td> +<td><strong>15</strong></td> +<td><strong>2x 80</strong></td> +<td><strong>0.42</strong></td> +<td><strong>16.46</strong></td> +<td><strong>14.56</strong></td> +<td><strong>141 107</strong></td> +<td><strong>124 839</strong></td> +<td><strong>1.82</strong></td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>8/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>23.23</strong></td> +<td><strong>21.17</strong></td> +<td><strong>99 578</strong></td> +<td><strong>90 736</strong></td> +<td><strong>1.32</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>8/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>22.89</td> +<td>20.39</td> +<td>98 100</td> +<td>87 386</td> +<td>1.27</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/2</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.6</td> +<td>19.11</td> +<td>114 000</td> +<td>81 900</td> +<td>1.19</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.19</td> +<td>19.18</td> +<td>112 243</td> +<td>82 200</td> +<td>1.2</td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>14/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>30.84</strong></td> +<td><strong>16.88</strong></td> +<td><strong>132 171</strong></td> +<td><strong>72 343</strong></td> +<td><strong>1.06</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>14/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>29.67</td> +<td>17.8</td> +<td>127 157</td> +<td>76 286</td> +<td>1.11</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>8/2</td> +<td>256</td> +<td>8x 256</td> 
+<td>0.85</td> +<td>37.11</td> +<td>32.04</td> +<td>156 712</td> +<td>135 302</td> +<td>1</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>8/3</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>37.31</td> +<td>32.07</td> +<td>157 557</td> +<td>135 429</td> +<td>1</td> +</tr> +<tr> +<td><strong>Local</strong></td> +<td><strong>32</strong></td> +<td><strong>10/2</strong></td> +<td><strong>256</strong></td> +<td><strong>8x 256</strong></td> +<td><strong>0.85</strong></td> +<td><strong>40</strong></td> +<td><strong>31.01</strong></td> +<td><strong>168 916</strong></td> +<td><strong>130 952</strong></td> +<td><strong>0.97</strong></td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>14/2</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>36.39</td> +<td>26.42</td> +<td>153 672</td> +<td>111 569</td> +<td>0.83</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>14/3</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>36.22</td> +<td>26.39</td> +<td>152 954</td> +<td>111 443</td> +<td>0.82</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>20/2</td> +<td>256</td> +<td>8x 256</td> +<td>0.85</td> +<td>34.59</td> +<td>23.86</td> +<td>146 070</td> +<td>100 759</td> +<td>0.75</td> +</tr> +</tbody> +</table> +<h3 id="the-optimal-number-of-test-agents">The Optimal Number of Test Agents</h3> +<p>Experimenting with different number of aggregation (read) and editorial (write) agents at c3.4xlarge and the local server, we made some interesting observations:</p> +<ul> +<li>There is almost no benefit to use more than 2 write agents. This can be explained by the fact that certain aspects of handling writes in GraphDB are serialized, i.e. they cannot be executed in parallel across multiple write threads;</li> +<li>Using more read agents can have negative impact on update performance. This is proven by the c3.4xlarge results with 8/2 and with 14/2 agents - while in the later case GraphDB handles a bit higher amount of queries (31 vs. 23) we see a drop in the updates rates (from 21 to 17);</li> +<li>Overall, the configuration with 8 read agents and 2 write agents delivers good balanced results across various hardware configurations;</li> +<li>For machines with more than 16 cores, a configuration like 10/2 or 14/2, would maximize the number of selects, still with good update rates. This way one can get 30 queries/sec. on c3.4xlarge and 40 queries/sec. on a local server;</li> +<li>Launching more than 14 read agents does not help even on local server with 32 logical cores. This indicates that at this point we are reaching some constraints such as memory bandwidth or IO throughput and degree of parallelization.</li> +<li>There is some overhead when handling bigger number of agents as the results for the local server tests with 14/3 and 20/2 show the worst results for both queries and updates.</li> +</ul> +<h3 id="efficiency-and-cost">Efficiency and Cost</h3> +<p>AWS instance type c3.2xlarge provides the best price/performance ratio for applications where 15 updates/sec. are sufficient even at peak times. 
More intensive applications should use type c3.4xlarge, which guarantees more than 20 updates/sec.</p>
+<p>Cloud infrastructure providers like Amazon allow one to keep a very clear account of the full cost of the server infrastructure, including hardware, hosting, electricity, network, etc.</p>
+<p>$1 spent on c3.2xlarge ($0.42/hour) pays for handling around 140 000 queries, along with more than 120 000 update operations!</p>
+<p>The full cost of the server infrastructure is harder to compute when purchasing a server and hosting it in a proprietary data center. Still, one can estimate the upper limits - for a machine like the local server used in this benchmark, the price is well below $1/hour. One should also keep in mind that this machine has 256 GB of RAM, which is overkill for the Semantic Publishing Benchmark run at the 50M scale. Under all these assumptions, the local server is cheaper than the most cost-efficient AWS instance. This is expected - owning a car is always cheaper than renting it for 3 years in a row. In fact, the small difference in price per query indicates that using AWS services comes at very low extra cost.</p>
+<p>To put these figures in the context of a known real-world application, let us model the case of a GraphDB Enterprise replication cluster with 2 master nodes and 6 worker nodes - the size of the cluster that the BBC used for their FIFA World Cup 2010 project. Given the c3.2xlarge instance type, the math works as follows:</p>
+<ul>
+<li><strong>100 queries/sec.</strong> handled by the cluster. This means about 360 000 queries per hour, or more than 4 million queries per day. This is at least 2 times more than the actual load on GraphDB at the BBC during the peak times of big sports events.</li>
+<li><strong>10 updates/sec.</strong> - the update speed of a GraphDB Enterprise cluster is lower than that of each worker node in isolation. There are relatively few content management applications that need more than 36 000 updates per hour.</li>
+<li><strong>$81/day</strong> is the full cost of the server infrastructure. This indicates an annual operational cost in the range of $30 000 for a cluster of this type, even without any effort to release some of the worker nodes in non-peak times.</li>
+</ul>
+
+
+
+
+ DATAGEN: a Realistic Social Network Data Generator
+ https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/
+ Sat, 06 Dec 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/
+ <p>In previous posts (<a href="https://ldbcouncil.org/post/getting-started-with-snb">Getting started with snb</a>, <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">DATAGEN: data generation for the Social Network Benchmark</a>), Arnau Prat discussed the main features and characteristics of DATAGEN: <em>realism</em>, <em>scalability</em>, <em>determinism</em>, <em>usability</em>. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity in a social network site during a period of time. In this post, we conduct a series of experiments that will shed some light on how realistic the data produced by DATAGEN looks.
For our testing, we generated a dataset of scale factor 10 (i.e., social network of 73K users during 3 years) and loaded it into Virtuoso by following the <a href="https://github.com/ldbc/ldbc_snb_datagen">instructions for generating a SNB dataset</a> and <a href="https://github.com/ldbc/ldbc_snb_implementations/tree/master/interactive/virtuoso">for loading the dataset into Virtuoso</a>. In the following sections, we analyze several aspects of the generated dataset.</p> +<h3 id="a-realistic-social-graph">A Realistic social graph</h3> +<p>One of the most complexly structured graphs that can be found in the data produced by DATAGEN is the friends graph, formed by people and their <em><knows></em> relationships. We used the R script after Figure 1 to draw the social degree distribution in the SNB friends graph. As shown in Figure 1, the cumulative social degree distribution of the friends graph is similar to that from Facebook (See the note about <a href="https://www.facebook.com/notes/facebook-data-team/anatomy-of-facebook/10150388519243859">Facebook Anatomy</a>). This is not by chance, as DATAGEN has been designed to deliberately reproduce the Facebook&rsquo;s graph distribution.</p> +<p><img src="Cumulative-distribution.png" alt="image"> <br> +Figure 1: Cumulative distribution #friends per user</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-r" data-lang="r"><span style="display:flex;"><span><span style="color:#75715e">#R script for generating the social degree distribution </span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">#Input files: person_knows_person_*.csv</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(data.table) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(igraph) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(plotrix) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">require</span>(bit64) +</span></span><span style="display:flex;"><span>dflist <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">lapply</span>(<span style="color:#a6e22e">commandArgs</span>(trailingOnly <span style="color:#f92672">=</span> <span style="color:#66d9ef">TRUE</span>), fread, sep<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;|&#34;</span>, +</span></span><span style="display:flex;"><span> header<span style="color:#f92672">=</span>T, select<span style="color:#f92672">=</span><span style="color:#ae81ff">1</span><span style="color:#f92672">:</span><span style="color:#ae81ff">2</span>, colClasses<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;integer64&#34;</span>) +</span></span><span style="display:flex;"><span> df <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">rbindlist</span>(dflist) <span style="color:#a6e22e">setNames</span>(df, <span style="color:#a6e22e">c</span>(<span style="color:#e6db74">&#34;P1&#34;</span>, <span style="color:#e6db74">&#34;P2&#34;</span>)) +</span></span><span style="display:flex;"><span>d2 <span style="color:#f92672">&lt;-</span> df[,<span style="color:#a6e22e">length</span>(P2),by<span style="color:#f92672">=</span>P1] +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">pdf</span>(<span 
style="color:#e6db74">&#34;socialdegreedist.pdf&#34;</span>) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">plot</span>(<span style="color:#a6e22e">ecdf</span>(d2<span style="color:#f92672">$</span>V1),main<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Cummulative distribution #friends per user&#34;</span>, +</span></span><span style="display:flex;"><span> xlab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Number of friends&#34;</span>, ylab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Percentage number of users&#34;</span>, log<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;x&#34;</span>, +</span></span><span style="display:flex;"><span> xlim<span style="color:#f92672">=</span><span style="color:#a6e22e">c</span>(<span style="color:#ae81ff">0.8</span>, <span style="color:#a6e22e">max</span>(d2<span style="color:#f92672">$</span>V1) <span style="color:#f92672">+</span> <span style="color:#ae81ff">20</span>)) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">dev.off</span>() +</span></span></code></pre></div><h3 id="data-correlations">Data Correlations</h3> +<p>Data in real life as well as in a real social network is correlated; e.g. names of people living in Germany have a different distribution than those living in Netherlands, people who went to the same university in the same period have a much higher probability to be friends and so on and so forth. In this experiment we will analyze if data produced by DATAGEN also reproduces these phenomena.</p> +<p><em>Which are the most popular names of a country?</em></p> +<p>We run the following query on the database built in Virtuoso, which computes the distribution of the names of the people for a given country. In this query, <em>&lsquo;A_country_name&rsquo;</em> is the name of a particular country such as <em>&lsquo;Germany&rsquo;, &lsquo;Netherlands&rsquo;, or &lsquo;Vietnam&rsquo;</em>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> p_lastname, <span style="color:#66d9ef">count</span> (p_lastname) <span style="color:#66d9ef">as</span> namecnt +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">FROM</span> person, country +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> p_placeid <span style="color:#f92672">=</span> ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;A_country_name&#39;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> p_lastname <span style="color:#66d9ef">order</span> <span style="color:#66d9ef">by</span> namecnt <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we can see from Figures 2, 3, and 4, the distributions of names in Germany, Netherlands and Vietnam are different. A name that is popular in Germany such as <em>Muller</em> is not popular in the Netherlands, and it even does not appear in the names of people in Vietnam. 
We note that the names&rsquo; distribution may not be exactly the same as the contemporary names&rsquo; distribution in these countries, since the names resource files used in DATAGEN are extracted from Dbpedia, which may contain names from different periods of time.</p> +<p><img src="distribution-germany.png" alt="image"> <br> +Figure 2. Distribution of names in Germany</p> +<p><img src="distribution-netherlands.png" alt=""> <br> +Figure 3. Distribution of names in Netherlands</p> +<p><img src="distribution-vietnam.png" alt=""> <br> +Figure 4. Distribution of names in Vietnam</p> +<p><em>Where my friends are living?</em></p> +<p>We run the following query, which computes the locations of the friends of people living in China.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> fctry.ctry_name, <span style="color:#66d9ef">count</span> (<span style="color:#f92672">*</span>) <span style="color:#66d9ef">from</span> person <span style="color:#66d9ef">self</span>, person +</span></span><span style="display:flex;"><span>friend, country pctry, knows, country fctry +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> pctry.ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;China&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> <span style="color:#66d9ef">self</span>.p_placeid <span style="color:#f92672">=</span> pctry.ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> <span style="color:#66d9ef">self</span>.p_personid <span style="color:#66d9ef">and</span> friend.p_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> fctry.ctry_city <span style="color:#f92672">=</span> friend.p_placeid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> fctry.ctry_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As shown in the graph, most of the friends of people living in China are also living in China. The rest comes predominantly from near-by countries such as India, Vietnam.</p> +<p><img src="chinese-friends.png" alt=""> <br> +Figure 5. 
Locations of friends of people in China</p> +<p><em>Where my friends are studying?</em></p> +<p>Finally, we run the following query to find where the friends of people studying at a specific university (e.g., “Hangzhou_International_School”) are studying at.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> o2.o_name, <span style="color:#66d9ef">count</span>(o2.o_name) <span style="color:#66d9ef">from</span> knows, person_university +</span></span><span style="display:flex;"><span>p1, person_university p2, organisation o1, organisation o2 +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> +</span></span><span style="display:flex;"><span> p1.pu_organisationid <span style="color:#f92672">=</span> o1.o_organisationid +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> o1.o_name<span style="color:#f92672">=</span><span style="color:#e6db74">&#39;Hangzhou_International_School&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> p1.pu_personid <span style="color:#66d9ef">and</span> p2.pu_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> p2.pu_organisationid <span style="color:#f92672">=</span> o2.o_organisationid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> o2.o_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we see from Figure 6, most of the friends of the Hangzhou International School students also study at that university. This is a realistic correlation, as people studying at the same university have a much higher probability to be friends. Furthermore, top-10 universities for the friends of the Hangzhou School students’ are from China, while people from foreign universities have small number of friends that study in Hangzhou School (See Table 1).</p> +<p><img src="friends-international-school.png" alt=""> <br> +Figure 6. Top-10 universities where the friends of Hangzhou International School students are studying at.</p> +<table> +<thead> +<tr> +<th>Name</th> +<th># of friends</th> +</tr> +</thead> +<tbody> +<tr> +<td>Hangzhou_International_School</td> +<td>12696</td> +</tr> +<tr> +<td>Anhui_University_of_Science_and_Technology</td> +<td>4071</td> +</tr> +<tr> +<td>China_Jiliang_University</td> +<td>3519</td> +</tr> +<tr> +<td>&hellip;</td> +<td></td> +</tr> +<tr> +<td>Darmstadt_University_of_Applied_Sciences</td> +<td>1</td> +</tr> +<tr> +<td>Calcutta_School_of_Tropical_Medicine</td> +<td>1</td> +</tr> +<tr> +<td>Chettinad_Vidyashram</td> +<td>1</td> +</tr> +<tr> +<td>Women&rsquo;s_College_Shillong</td> +<td>1</td> +</tr> +<tr> +<td>Universitas_Nasional</td> +<td>1</td> +</tr> +</tbody> +</table> +<p>Table 1. Universities where friends of Hangzhou International School students are studying at.</p> +<p>In a real social network, data is riddled with many more correlations; it is a true data mining task to extract these. 
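+</p>
+<p>Such correlations can also be probed directly on the generated files. The following minimal Python sketch estimates the fraction of friendship edges that connect people who studied at the same university; it assumes the pipe-separated CSV layout produced by DATAGEN (e.g. person_knows_person_*.csv and person_studyAt_organisation_*.csv with a header row and the two id columns first), and the exact file and column names may differ between DATAGEN versions:</p>
+<pre tabindex="0"><code># Sketch: fraction of friendship edges connecting people who studied at the
+# same university, computed directly on the generated CSV files (assumed layout).
+import csv
+from collections import defaultdict
+
+universities = defaultdict(set)
+with open("person_studyAt_organisation_0_0.csv") as f:   # assumed file name
+    reader = csv.reader(f, delimiter="|")
+    next(reader)                                          # skip header
+    for row in reader:
+        universities[row[0]].add(row[1])                  # person id, organisation id
+
+edges = same_university = 0
+with open("person_knows_person_0_0.csv") as f:            # assumed file name
+    reader = csv.reader(f, delimiter="|")
+    next(reader)                                          # skip header
+    for row in reader:
+        p1, p2 = row[0], row[1]
+        edges += 1
+        if not universities[p1].isdisjoint(universities[p2]):
+            same_university += 1
+
+print(same_university / edges if edges else 0.0)
+</code></pre>
+<p>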
Even though DATAGEN may not be able to model all the real life data correlations, it can generate a dataset that reproduce many of those important characteristics found in a real social network, and additionally introduce a series of plausible correlations in it. More and more interesting data correlations may also be found from playing with the SNB generated data.</p> + + + + + SNB Driver - Part 1 + https://ldbcouncil.org/post/snb-driver-part-1/ + Thu, 27 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-1/ + <p>In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as driver). Software and documentation for this driver is available here: <a href="https://github.com/ldbc/ldbc_driver/">https://github.com/ldbc/ldbc_driver/</a>. Multiple reference implementations by two vendors are available here: <a href="https://github.com/ldbc/ldbc_snb_implementations">https://github.com/ldbc/ldbc_snb_implementations</a>, and discussion of the schema, data properties, and related content is available here: <a href="https://github.com/ldbc/ldbc_snb_docs">https://github.com/ldbc/ldbc_snb_docs</a>.</p> +<p>The following will concentrate on key decisions and techniques that were developed to support scalable, repeatable, distributed workload execution.</p> +<h3 id="problem-description">Problem Description</h3> +<p>The driver generates a stream of operations (e.g. create user, create post, create comment, retrieve person&rsquo;s posts etc.) and then executes them using the provided database connector. To be capable of generating heavier loads, it executes the operations from this stream in parallel. If there were no dependencies between operations (e.g., reads that depend on the completion of writes) this would be trivial. This is the case, for example, for the classical TPC-C benchmark, where splitting transaction stream into parallel clients (terminals) is trivial. However, for LDBC SNB Interactive Workload this is not the case: some operations within the stream do depend on others, others are depended on, some both depend on others and are depended on, and some neither depend on others nor are they depended on.</p> +<p>Consider, for example, a Social Network Benchmark scenario, where the data generator outputs a sequence of events such as User A posted a picture, User B left a comment to the picture of User A, etc. The second event depends on the first one in a sense that there is a causal ordering between them: User B can only leave a comment on the picture once it has been posted. The generated events are already ordered by their time stamp, so in case of the single-threaded execution this ordering is observed by default: the driver issues a request to the SUT with the first event (i.e., User A posts a picture), after its completion it issues the second event (create a comment). However, if events are executed in parallel, these two events may end up in different parallel sequences of events. 
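+</p>
+<p>The following minimal Python sketch (purely illustrative, not the actual driver code) shows the kind of check this requires: an operation is held back until every parallel stream has completed all operations up to the timestamp of the event it depends on.</p>
+<pre tabindex="0"><code># Purely illustrative - not the actual driver code. Each parallel stream
+# reports the timestamp up to which it has completed its operations; a
+# dependent operation may only be submitted once the slowest stream has
+# progressed past the timestamp of the event it depends on.
+def can_execute(depends_on_time, progress_per_stream):
+    safe_time = min(progress_per_stream)   # the slowest stream defines what is safe
+    return depends_on_time &lt;= safe_time
+
+# A comment that depends on a picture posted at t=100 by another stream:
+print(can_execute(100, [99, 105]))    # False - the posting stream is only at t=99
+print(can_execute(100, [101, 105]))   # True  - the picture is guaranteed to exist
+</code></pre>
+<p>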
Therefore, a driver needs a mechanism to ensure the dependency is observed even when the dependent events are in different parallel update streams.</p> +<p>The next blog entries in this series will discuss the approaches used in the driver to deal with these challenges.</p> + + + + + Making Semantic Publishing Execution Rules + https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/ + Tue, 18 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/ + <p><a href="https://ldbcouncil.org/">LDBC</a> <a href="https://ldbcouncil.org/benchmarks/spb">SPB (Semantic Publishing Benchmark)</a> is based on the BBC linked data platform use case. Thus the data modelling and transaction mix reflects the BBC&rsquo;s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an <a href="https://www.ontotext.com/products/ontotext-graphdb-owlim/">Ontotext Graph DB</a> deployment. Graph DB was formerly known as Owlim.</p> +<p>So, in SPB we wanted to address substantially more complex queries than the lookups that the BBC linked data platform primarily serves. Diverse dataset summaries, timelines and faceted search qualified by keywords and/or geography are examples of online user experience that SPB needs to cover.</p> +<p>SPB is not per se an analytical workload but we still find that the queries fall broadly in two categories:</p> +<ul> +<li> +<p>Some queries are centred on a particular search or entity. The data touched by the query size does not grow at the same rate as the dataset.</p> +</li> +<li> +<p>Some queries cover whole cross sections of the dataset, e.g. find the most popular tags across the whole database.</p> +</li> +</ul> +<p>These different classes of questions need to be separated in a metric, otherwise the short lookup dominates at small scales and the large query at large scales.</p> +<p>Another guiding factor of SPB was the BBC&rsquo;s and others&rsquo; express wish to cover operational aspects such as online backups, replication and fail-over in a benchmark. True, most online installations have to deal with these things, which are yet as good as absent from present benchmark practice. We will look at these aspects in a different article, for now, I will just discuss the matter of workload mix and metric.</p> +<p>Normally the lookup and analytics workloads are divided into different benchmarks. Here we will try something different. There are three things the benchmark does:</p> +<ul> +<li> +<p>Updates - These sometimes insert a graph, sometimes delete and re-insert the same graph, sometimes just delete a graph. These are logarithmic to data size.</p> +</li> +<li> +<p>Short queries - These are lookups that most often touch on recent data and can drive page impressions. These are roughly logarithmic to data scale.</p> +</li> +<li> +<p>Analytics - These cover a large fraction of the dataset and are roughly linear to data size.</p> +</li> +</ul> +<p>A test sponsor can decide on the query mix within certain bounds. A qualifying run must sustain a minimum, scale-dependent update throughput and must execute a scale-dependent number of analytical query mixes or run for a scale-dependent duration. The minimum update rate, the minimum number of analytics mixes and the minimum duration all grow logarithmically to data size. Within these limits, the test sponsor can decide how to mix the workloads. Publishing several results, emphasizing different aspects is also possible. 
A given system may be specially good at one aspect, leading the test sponsor to accentuate this.</p> +<p>The benchmark has been developed and tested at small scales, between 50 and 150M triples. Next we need to see how it actually scales. There we expect to see how the two query sets behave differently. One effect that we see right away when loading data is that creating the full text index on the literals is in fact the longest running part. For a SF 32 ( 1.6 billion triples) SPB database we have the following space consumption figures:</p> +<ul> +<li> +<p>46886 MB of RDF literal text</p> +</li> +<li> +<p>23924 MB of full text index for RDF literals</p> +</li> +<li> +<p>23598 MB of URI strings</p> +</li> +<li> +<p>21981 MB of quads, stored column-wise with default index scheme</p> +</li> +</ul> +<p>Clearly, applying column-wise compression to the strings is the best move for increasing scalability. The literals are individually short, so literal per literal compression will do little or nothing but applying this by the column is known to get a 2x size reduction with Google Snappy. The full text index does not get much from column store techniques, as it already consists of words followed by space efficient lists of word positions. The above numbers are measured with Virtuoso column store, with quads column wise and the rest row-wise. Each number includes the table(s) and any extra indices associated to them.</p> +<p>Let&rsquo;s now look at a full run at unit scale, i.e. 50M triples.</p> +<p>The run rules stipulate a minimum of 7 updates per second. The updates are comparatively fast, so we set the update rate to 70 updates per second. This is seen not to take too much CPU. We run 2 threads of updates, 20 of short queries and 2 of long queries. The minimum run time for the unit scale is 10 minutes, so we do 10 analytical mixes, as this is expected to take 10 a little over 10 minutes. The run stops by itself when the last of the analytical mixes finishes.</p> +<p>The interactive driver reports:</p> +<pre tabindex="0"><code>Seconds run : 2144 + Editorial: + 2 agents + + 68164 inserts (avg : 46 ms, min : 5 ms, max : 3002 ms) + 8440 updates (avg : 72 ms, min : 15 ms, max : 2471 ms) + 8539 deletes (avg : 37 ms, min : 4 ms, max : 2531 ms) + + 85143 operations (68164 CW Inserts (98 errors), 8440 CW Updates (0 errors), 8539 CW Deletions (0 errors)) + 39.7122 average operations per second + + Aggregation: + 20 agents + + 4120 Q1 queries (avg : 789 ms, min : 197 ms, max : 6767 ms, 0 errors) + 4121 Q2 queries (avg : 85 ms, min : 26 ms, max : 3058 ms, 0 errors) + 4124 Q3 queries (avg : 67 ms, min : 5 ms, max : 3031 ms, 0 errors) + 4118 Q5 queries (avg : 354 ms, min : 3 ms, max : 8172 ms, 0 errors) + 4117 Q8 queries (avg : 975 ms, min : 25 ms, max : 7368 ms, 0 errors) + 4119 Q11 queries (avg : 221 ms, min : 75 ms, max : 3129 ms, 0 errors) + 4122 Q12 queries (avg : 131 ms, min : 45 ms, max : 1130 ms, 0 errors) + 4115 Q17 queries (avg : 5321 ms, min : 35 ms, max : 13144 ms, 0 errors) + 4119 Q18 queries (avg : 987 ms, min : 138 ms, max : 6738 ms, 0 errors) + 4121 Q24 queries (avg : 917 ms, min : 33 ms, max : 3653 ms, 0 errors) + 4122 Q25 queries (avg : 451 ms, min : 70 ms, max : 3695 ms, 0 errors) + + 22.5239 average queries per second. 
Pool 0, queries [ Q1 Q2 Q3 Q5 Q8 Q11 Q12 Q17 Q18 Q24 Q25 ] + + 45318 total retrieval queries (0 timed-out) + 22.5239 average queries per second +</code></pre><p>The analytical driver reports:</p> +<pre tabindex="0"><code>Aggregation: + 2 agents + + 14 Q4 queries (avg : 9984 ms, min : 4832 ms, max : 17957 ms, 0 errors) + 12 Q6 queries (avg : 4173 ms, min : 46 ms, max : 7843 ms, 0 errors) + 13 Q7 queries (avg : 1855 ms, min : 1295 ms, max : 2415 ms, 0 errors) + 13 Q9 queries (avg : 561 ms, min : 446 ms, max : 662 ms, 0 errors) + 14 Q10 queries (avg : 2641 ms, min : 1652 ms, max : 4238 ms, 0 errors) + 12 Q13 queries (avg : 595 ms, min : 373 ms, max : 1167 ms, 0 errors) + 12 Q14 queries (avg : 65362 ms, min : 6127 ms, max : 136346 ms, 2 errors) + 13 Q15 queries (avg : 45737 ms, min : 12698 ms, max : 59935 ms, 0 errors) + 13 Q16 queries (avg : 30939 ms, min : 10224 ms, max : 38161 ms, 0 errors) + 13 Q19 queries (avg : 310 ms, min : 26 ms, max : 1733 ms, 0 errors) + 12 Q20 queries (avg : 13821 ms, min : 11092 ms, max : 15435 ms, 0 errors) + 13 Q21 queries (avg : 36611 ms, min : 14164 ms, max : 70954 ms, 0 errors) + 13 Q22 queries (avg : 42048 ms, min : 7106 ms, max : 74296 ms, 0 errors) + 13 Q23 queries (avg : 48474 ms, min : 18574 ms, max : 93656 ms, 0 errors) + 0.0862 average queries per second. Pool 0, queries [ Q4 Q6 Q7 Q9 Q10 Q13 Q14 Q15 Q16 Q19 Q20 Q21 Q22 Q23 ] + + 180 total retrieval queries (2 timed-out) + 0.0862 average queries per second +</code></pre><p>The metric would be 22.52 qi/s, 310 qa/h, 39.7 u/s @ 50Mt (SF 1)</p> +<p>The SUT is dual Xeon E5-2630, all in memory. The platform utilization is steadily above 2000% CPU (over 20/24 hardware threads busy on the DBMS). The DBMS is Virtuoso open source, (<a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack at github.com</a>, <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics</a>).</p> +<p>The minimum update rate of 7/s was sustained but fell short of the target of 70./s. In this run, most demand was put on the interactive queries. Different thread allocations would give different ratios of the metric components. The analytics mix is for example about 3x faster without other concurrent activity.</p> +<p>Is this good or bad? I would say that this is possible but better can certainly be accomplished.</p> +<p>The initial observation is that Q17 is the worst of the interactive lot. 3x better is easily accomplished by avoiding a basic stupidity. The query does the evil deed of checking for a substring in a URI. This is done in the wrong place and accounts for most of the time. The query is meant to test geo retrieval but ends up doing something quite different. Optimizing this right would almost double the interactive score. There are some timeouts in the analytical run, which as such disqualifies the run. This is not a fully compliant result but is close enough to give an idea of the dynamics. So we see that the experiment is definitely feasible, is reasonably defined and that the dynamics seen make sense.</p> +<p>As an initial comment of the workload mix, I&rsquo;d say that interactive should have a few more very short point lookups to stress compilation times and give a higher absolute score of queries per second.</p> +<p>Adjustments to the mix will depend on what we find out about scaling. 
As with SNB, it is likely that the workload will shift a little, so this result might not be comparable with future ones.</p> +<p>In the next SPB article, we will look closer at performance dynamics and choke points and will have an initial impression on scaling the workload.</p> + + + + + Fifth TUC Meeting + https://ldbcouncil.org/event/fifth-tuc-meeting/ + Fri, 14 Nov 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fifth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce its fifth Technical User<br> +Community (TUC) meeting.</p> +<p>This will be a one-day event at the National Hellenic Research Institute<br> +in Athens, Greece on <strong>Friday November 14, 2014</strong>.</p> +<h3 id="agenda">Agenda</h3> +<p>10:30 - 11:00 Coffee Break</p> +<p>11:00 - 11:10 Peter Boncz (VUA) Welcome &amp; LDBC project status update (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979841.pptx">Presentation</a>)</p> +<p>11:10 - 11:25 Venelin Kotsev (ONTO) Semantic Publishing Benchmark:Short Presentation of SPB and Status</p> +<p>Feedback &amp; Roadmap for SPB &amp; OWLIM (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979839.pdf">Presentation</a>)</p> +<p>11:25 - 11:30 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SPB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979828.pdf">Presentation</a>)</p> +<p>11:30 - 11:45 Alex Averbuch (NEO) Social Network Benchmark: Short Presentation of SNB and Status, Feedback &amp; Roadmap for SNB &amp; Neo4J (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979830.pdf">Presentation</a>)</p> +<p>11:45 - 12:00 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SNB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979829.pdf">Presentation</a>)</p> +<p>12:00 - 12:20 Arnau Prat (UPC) &amp; Andrey Gubichev Status, Feedback &amp; Roadmap for SNB Interactive &amp; Sparksee (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979836.pdf">Presentation</a> ) and Business Intelligence (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979837.pdf">Presentation</a>)</p> +<p>12:20 - 12:40 Tomer Sagi, &ldquo;Experience with SNB and TitanDB at HP&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979838.pptx">Presentation</a> )</p> +<p>12:40 - 13:00 Jakob Nelson, &ldquo;graphbench.org on the SNB datagen&rdquo;</p> +<p>13:00 - 14:30 Lunch Break@Byzantine &amp; Christian Museum (<a href="http://www.byzantinemuseum.gr/en/">link</a>)</p> +<p>14:30 - 14:50 Olaf Hartig, &ldquo;Integrating the Property Graph and RDF data models&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979831.pdf">Presentation</a>)\</p> +<p>Documents: <a href="http://arxiv.org/abs/1409.3288">arxiv/1409.3288</a>, <a href="http://arxiv.org/abs/1406.3399">arxiv/1406.3399</a></p> +<p>14:50 - 15:10 Maria-Esther Vidal and Maribel Acosta, &ldquo;Challenges to be addressed during Benchmarking SPARQL Federated Engines&rdquo; (<a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979842.pdf">Presentation</a>)</p> +<p>15:10 - 15:30 Evaggelia Pitoura, &ldquo;Historical Queries on Graphs&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979835.pdf">Presentation</a>)</p> +<p>15:30 - 16:00 Coffee Break</p> +<p>16:00 - 16:20 Manolis Terrovitis, Giannis Liagos, George Papastefanatos, &ldquo;Efficient Identification of Implicit Facts in Incomplete OWL2-EL Knowledge Bases&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979843.pdf">Presentation</a>)</p> +<p>16:20 - 16:40 Gunes Aluc, &ldquo;WatDiv: How to Tune-up your RDF Data Management System&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979832.pdf">Presentation</a>)</p> +<p>16:40 - 17:00 Giorgos Kollias, Yannis Smaragdakis, &ldquo;Benchmarking @LogicBlox&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979840.pdf">Presentation</a>)</p> +<p>17:00 - 17:15 Hassan Chafi, &ldquo;Oracle Labs Graph Strategy&rdquo;</p> +<p>17:15 - 17:25 Yinglong Xia, &ldquo;Property Graphs for Industry Solution at IBM&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979834.pdf">Presentation</a>)</p> +<p>17:25 - 17:30 Arthur Keen, &ldquo;Short Introduction to SPARQLcity&rdquo;</p> +<p><em><strong>20:30 Dinner @ Konservokouti <a href="https://plus.google.com/114240752029716758955/about?gl=gr&amp;hl=en">(link)</a></strong></em></p> +<p><em><strong>Get a Taxi, and go to Ippokratous 148, Athens, Neapoli Exarheion</strong></em></p> +<h4 id="logistics">Logistics</h4> +<p>The meeting will be held at the <a href="http://www.eie.gr/index-en.html">National Hellenic Research Foundation</a> located in <a href="http://www.eie.gr/location-en.html">downtown Athens</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/5964344.gif" alt=""></p> +<h4 id="travel">Travel</h4> +<p>Athens, Greece&rsquo;s capital city, is easily accessible by air. Travelers on flights to Athens will land at Athens Eleftherios Venizelos International Airport.</p> +<p>To arrive in the city center, you can take the metro from the airport (Line #3) and stop at either stop Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations. You can also take express Bus X95 and stop again at either Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations (the latter is the terminus for the bus).</p> +<p>You can also take a taxi from the airport that runs on a fixed price for the city center (45 euros). More information on how to move around in Athens from the airport can be found here: <a href="http://www.aia.gr/traveler/">http://www.aia.gr/traveler/</a></p> + + + + + Getting Started With the Semantic Publishing Benchmark + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + Sun, 09 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + <p>The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. 
It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies proposed by BBC that define numerous properties for content; they contain asll RDFS schema constructs and certain OWL ones.</p> +<p>The benchmark proposes a data generator that uses the ontologies provided by BBC and reference datasets (again provided by BBC) to produce a set of valid instances; it works with a predefined set of distributions derived from the reference datasets. In addition to these distributions, the data generator also models:</p> +<ul> +<li>clustering of creative works around certain entities from the reference datasets (e.g. the association of an entity with creative works would decay exponentially in time)</li> +<li>correlations between entities - there will be creative works about two entities for a certain period in time, that way a history of interactions is also modelled (e.g. J. Biden and B. Obama are tagged in creative works for a continuous period in time)</li> +</ul> +<p>The driver proposed by the benchmark measures the performance of CRUD operations of a SPARQL endpoint by starting a number of concurrently running editorial and aggregation agents. The former executes a series of insert, update and delete operations, whereas the latter a set of construct, describe, and select queries on a SPARQL endpoint. The benchmark can access all SPARQL endpoints that support the SPARQL 1.1 protocol. Tests have been run on OWLIM and Virtuoso. Attempts were also made for Stardog.</p> +<p>Currently, the benchmark offers two workloads: a base version that consists of a mix of nine queries of different complexity that consider nearly all the features of SPARQL 1.1 query language including sorting, subqueries, limit, regular expressions and grouping. 
The queries aim at checking different choke points relevant to query optimisation such as:</p> +<ul> +<li>join ordering based on cardinality constraints - expressed by the different kinds of properties defined in the schema</li> +<li>subselects that aggregate the query results that the optimiser should recognise and evaluate first</li> +<li>optional and nested optional clauses where the optimiser is called to produce a plan where the execution of the optional triple patterns is performed last</li> +<li>reasoning along the RDFS constructs (subclass, subproperty hierarchies, functional, object and transitive properties etc.)</li> +<li>unions to be executed in parallel</li> +<li>optionals that contain filter expressions that should be executed as early as possible in order to eliminate intermediate results</li> +<li>ordering where the optimiser could consider the possibility to choose query plan(s) that facilitate the ordering of results</li> +<li>handling of geo-spatial predicates</li> +<li>full-text search optimisation</li> +<li>asynchronous execution of the aggregate sub-queries</li> +<li>use of distinct to choose the optimal query plan</li> +</ul> +<p>We give below Query 1 of the Semantic Publishing Benchmark.</p> +<pre tabindex="0"><code>PREFIX bbcevent:&lt;http://www.bbc.co.uk/ontologies/event/&gt; +PREFIX geo-pos:&lt;http://www.w3.org/2003/01/geo/wgs84_pos#&gt; +PREFIX bbc:&lt;http://www.bbc.co.uk/ontologies/bbc/&gt; +PREFIX time:&lt;http://www.w3.org/2006/time#&gt; +PREFIX event:&lt;http://purl.org/NET/c4dm/event.owl#&gt; +PREFIX music-ont:&lt;http://purl.org/ontology/mo/&gt; +PREFIX rdf:&lt;http://www.w3.org/1999/02/22-rdf-syntax-ns#&gt; +PREFIX foaf:&lt;http://xmlns.com/foaf/0.1/&gt; +PREFIX provenance:&lt;http://www.bbc.co.uk/ontologies/provenance/&gt; +PREFIX owl:&lt;http://www.w3.org/2002/07/owl#&gt; +PREFIX cms:&lt;http://www.bbc.co.uk/ontologies/cms/&gt; +PREFIX news:&lt;http://www.bbc.co.uk/ontologies/news/&gt; +PREFIX cnews:&lt;http://www.bbc.co.uk/ontologies/news/cnews/&gt; +PREFIX cconcepts:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX dbp-prop:&lt;http://dbpedia.org/property/&gt; +PREFIX geonames:&lt;http://sws.geonames.org/&gt; +PREFIX rdfs:&lt;http://www.w3.org/2000/01/rdf-schema#&gt; +PREFIX domain:&lt;http://www.bbc.co.uk/ontologies/domain/&gt; +PREFIX dbpedia:&lt;http://dbpedia.org/resource/&gt; +PREFIX geo-ont:&lt;http://www.geonames.org/ontology#&gt; +PREFIX bbc-pont:&lt;http://purl.org/ontology/po/&gt; +PREFIX tagging:&lt;http://www.bbc.co.uk/ontologies/tagging/&gt; +PREFIX sport:&lt;http://www.bbc.co.uk/ontologies/sport/&gt; +PREFIX skosCore:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX dbp-ont:&lt;http://dbpedia.org/ontology/&gt; +PREFIX xsd:&lt;http://www.w3.org/2001/XMLSchema#&gt; +PREFIX core:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX curric:&lt;http://www.bbc.co.uk/ontologies/curriculum/&gt; +PREFIX skos:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX cwork:&lt;http://www.bbc.co.uk/ontologies/creativework/&gt; +PREFIX fb:&lt;http://rdf.freebase.com/ns/&gt; + +# Query Name : query1 +# Query Description : +# Retrieve creative works about thing t (or that mention t) +# reasoning: rdfs:subClassOf, rdf:type +# join ordering: cwork:dateModified rdf:type owl:FunctionalProperty +# join ordering: cwork:dateCreated rdf:type owl:FunctionalProperty +# Choke Points : +# - join ordering based on cardinality of functional proerties cwork:dateCreated, cwork:dateModified +# Optimizer should use an efficient cost evaluation method 
for choosing the optimal join tree +# - A sub-select which aggregates results. Optimizer should recognize it and execute it first +# - OPTIONAL and nested OPTIONAL clauses (treated by query optimizer as nested sub-queries) +# Optimizer should decide to put optional triples on top of the join tree +# (i.e. delay their execution to the last possible moment) because OPTIONALs are treated as a left join +# - qiery optimizer has the chance to recognize the triple pattern : ?cWork a ?type . ?type rdfs:subClassOf cwork:CreativeWork +# and eliminate first triple (?cwork a ?type .) since ?cwork is a cwork:CreativeWork​ + +CONSTRUCT { + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:shortTitle ?shortTitle ; + cwork:about ?about ; + cwork:mentions ?mentions ; + cwork:dateCreated ?created ; + cwork:dateModified ?modified ; + cwork:description ?description ; + cwork:primaryFormat ?primaryFormat ; + bbc:primaryContentOf ?webDocument . + ?webDocument bbc:webDocumentType ?webDocType . + ?about rdfs:label ?aboutLabel ; + bbc:shortLabel ?aboutShortLabel ; + bbc:preferredLabel ?aboutPreferredLabel . + ?mentions rdfs:label ?mentionsLabel ; + bbc:shortLabel ?mentionsShortLabel ; + bbc:preferredLabel ?mentionsPreferredLabel . + ?creativeWork cwork:thumbnail ?thumbnail . + ?thumbnail a cwork:Thumbnail ; + cwork:altText ?thumbnailAltText ; + cwork:thumbnailType ?thumbnailType . +} +WHERE { + { + SELECT ?creativeWork + WHERE { + ?creativeWork {{{cwAboutOrMentions}}} {{{cwAboutOrMentionsUri}}} . + ?creativeWork a cwork:CreativeWork ; + cwork:dateModified ?modified . + } + ORDER BY DESC(?modified) + LIMIT 10 + } + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:dateModified ?modified . + OPTIONAL { ?creativeWork cwork:shortTitle ?shortTitle . } + OPTIONAL { ?creativeWork cwork:description ?description . } + OPTIONAL { ?creativeWork cwork:about ?about . + OPTIONAL { ?about rdfs:label ?aboutLabel . } + OPTIONAL { ?about bbc:shortLabel ?aboutShortLabel . } + OPTIONAL { ?about bbc:preferredLabel ?aboutPreferredLabel . } + } + OPTIONAL { + ?creativeWork cwork:mentions ?mentions . + OPTIONAL { ?mentions rdfs:label ?mentionsLabel . } + OPTIONAL { ?mentions bbc:shortLabel ?mentionsShortLabel . } + OPTIONAL { ?mentions bbc:preferredLabel ?mentionsPreferredLabel . } + } + OPTIONAL { ?creativeWork cwork:dateCreated ?created . } + OPTIONAL { ?creativeWork cwork:primaryFormat ?primaryFormat . } + OPTIONAL { ?webDocument bbc:primaryContent ?creativeWork . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork bbc:primaryContentOf ?webDocument . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork cwork:thumbnail ?thumbnail . + OPTIONAL { ?thumbnail cwork:altText ?thumbnailAltText . } + OPTIONAL { ?thumbnail cwork:thumbnailType ?thumbnailType . } + } +} +</code></pre><p>Listing 1. Semantic Publishing Benchmark: Query 1</p> +<p>The benchmark test driver is distributed as a jar file, but can also be built using an ant script. It is distributed with the BBC ontologies and reference datasets, the queries and update workloads discussed earlier and the configuration parameters for running the benchmark and for generating the data. 
It is organised in the following different phases: ontology loading and reference dataset loading, dataset generation and loading, warm up (where a series of aggregation queries are run for a predefined amount of time), benchmark where all queries (aggregation and editorial) are run, conformance checking (that allows one to check whether the employed RDF engine implements OWL reasoning) and finally cleanup that removes all the data from the repository. The benchmark provides a certain degree of freedom where each phase can run independently of the others.</p> +<p>The data generator uses an RDF repository to load ontologies and reference datasets; actually, any system that will be benchmarked should have those ontologies loaded. Any repository that will be used for the data generation should be set up with context indexing, and finally geo-spatial indexing, if available, to serve the spatial queries. The current version of the benchmark has been tested with Virtuoso and OWLIM.</p> +<p>The generator uses configuration files that must be configured appropriately to set the values regarding the dataset size to produce, the number of aggregation and editorial agents, the query time out etc. The distributions used by the data generator could also be edited. The benchmark is very simple to run (once the RDF repository used to store the ontologies and the reference datasets is set up, and the configuration files updated appropriately) using the command: java -jar semantic_publishing_benchmark-*.jar test.properties. The benchmark produces three kinds of files that contain (a) brief information about each executed query, the size of the returned result, and the execution time (semantic_publishing_benchmark_queries_brief.log), (b) the detailed log of each executed query and its result (semantic_publishing_benchmark_queries_detailed.log) (c) the benchmark results (semantic_publishing_benchmark_results.log ).</p> +<p>Below we give an example of a run of the benchmark for OWLIM-SE. The benchmark reports the number of edit operations (inserts, updates, and writes) and queries executed at the Nth second of a benchmark run. It also reports that total number of retrieval queries as well as the average number of queries executed per second.</p> +<pre tabindex="0"><code>Seconds run : 600 + Editorial: + 0 agents + + 0 operations (0 CW Inserts, 0 CW Updates, 0 CW Deletions) + 0.0000 average operations per second + + Aggregation: + 8 agents + + 298 Q1 queries + 267 Q2 queries + 243 Q3 queries + 291 Q4 queries + 320 Q5 queries + 286 Q6 queries + 255 Q7 queries + 274 Q8 queries + 271 Q9 queries + + 2505 total retrieval queries + 4.1750 average queries per second +</code></pre><p>Listing 2. A snippet of semantic_publishing_benchmark_results.log</p> +<p>We run the benchmark under the following configuration: we used 8 aggregation agents for query execution and 4 data generator workers all running in parallel. The warm up period is 120 seconds during which a number of aggregation agents is executed to prepare the tested systems for query execution. Aggregation agents run for a period of 600 seconds, and queries timeout after 90 seconds. We used 10 sets of substitution parameters for each query. For data generation, ontologies and reference datasets are loaded in the OWLIM-SE repository. We used OWLIM-SE, Version 5.4.6287 with Sesame Version 2.6 and Tomcat Version 6. 
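+</p>
+<p>The per-query counts and rates reported in this log are straightforward to extract programmatically; a minimal Python sketch, assuming the format shown in Listing 2:</p>
+<pre tabindex="0"><code># Sketch: extract per-query counts and the average query rate from
+# semantic_publishing_benchmark_results.log (format as in Listing 2 above).
+import re
+
+counts = {}
+average_rate = None
+with open("semantic_publishing_benchmark_results.log") as f:
+    for line in f:
+        m = re.match(r"\s*(\d+)\s+(Q\d+)\s+queries", line)
+        if m:
+            counts[m.group(2)] = int(m.group(1))
+        m = re.match(r"\s*([\d.]+)\s+average queries per second", line)
+        if m:
+            average_rate = float(m.group(1))
+
+print(counts)         # e.g. {'Q1': 298, 'Q2': 267, ...}
+print(average_rate)   # e.g. 4.175
+</code></pre>
+<p>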
The results we obtained for the 10M, 100M and 1B triple datasets are given in the table below:</p> +<table> +<thead> +<tr> +<th>#triples</th> +<th>Q1</th> +<th>Q2</th> +<th>Q3</th> +<th>Q4</th> +<th>Q5</th> +<th>Q6</th> +<th>Q7</th> +<th>Q8</th> +<th>Q9</th> +<th>#queries</th> +<th>avg. #q. per sec.</th> +</tr> +</thead> +<tbody> +<tr> +<td>10M</td> +<td>298</td> +<td>267</td> +<td>243</td> +<td>291</td> +<td>320</td> +<td>286</td> +<td>255</td> +<td>274</td> +<td>271</td> +<td>2505</td> +<td>41,750</td> +</tr> +<tr> +<td>100M</td> +<td>53</td> +<td>62</td> +<td>51</td> +<td>52</td> +<td>44</td> +<td>62</td> +<td>25</td> +<td>55</td> +<td>45</td> +<td>449</td> +<td>7,483</td> +</tr> +<tr> +<td>1B</td> +<td>34</td> +<td>29</td> +<td>22</td> +<td>24</td> +<td>25</td> +<td>29</td> +<td>0</td> +<td>29</td> +<td>28</td> +<td>220</td> +<td>3,667</td> +</tr> +</tbody> +</table> + + + + + Choke Point Based Benchmark Design + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + <p>The <em>Linked Data Benchmark Council</em> (LDBC) mission is to design and maintain benchmarks for graph data management systems, and establish and enforce standards in running these benchmarks, and publish and arbitrate around the official benchmark results. The council and its <a href="https://ldbcouncil.org">https://ldbcouncil.org</a> website just launched, and in its first 1.5 year of existence, most effort at LDBC has gone into investigating the needs of the field through interaction with the LDBC Technical User Community (<a href="https://ldbcouncil.org/event/fifth-tuc-meeting">next TUC meeting</a> will be on October 5 in Athens) and indeed in <em>designing benchmarks</em>.</p> +<p>So, what makes a good benchmark design? Many talented people have paved our way in addressing this question and for relational database systems specifically the benchmarks produced by <a href="http://www.tpc.org/">TPC</a> have been very helpful in maturing relational database technology, and making it successful. Good benchmarks are <em>relevant</em> and <em>representative</em> (address important challenges encountered in practice), <em>understandable</em> , <em>economical</em> (implementable on simple hardware), <em>fair</em> (such as not to favor a particular product or approach), <em>scalable</em>, <em>accepted</em> by the community and <em>public</em> (e.g. all of its software is available in open source). This list stems from Jim Gray&rsquo;s <a href="http://research.microsoft.com/en-us/um/people/gray/BenchmarkHandbook/TOC.htm">Benchmark Handbook</a>. In this blogpost, I will share some thoughts on each of these aspects of good benchmark design.</p> +<p>A very important aspect of benchmark development is making sure that the community <em>accepts</em> a certain benchmark, and starts using it. A benchmark without published results and therefore opportunity to compare results, remains irrelevant. A European FP7 project is a good place to start gathering a critical mass of support (and consensus, in the process) for a new benchmark from the core group of benchmark designers in the joint work performed by the consortium. Since in LDBC multiple commercial graph and RDF vendors are on the table (Neo Technologies, Openlink, Ontotext and Sparsity) a minimal consensus on <strong>fairness</strong> had to be established immediately. 
The Linked Data Benchmark Council itself is a noncommercial, neutral, entity which releases all its benchmark specifications, software, as well as many materials created during the design. LDBC has spent a lot of time engaging interested parties (mainly through its <a href="https://ldbcouncil.org/tags/tuc-meeting/">Technical User Community gatherings</a>) as well as lining up additional organizations as members of the Linked Data Benchmark Council. There is, in other words, a strong non-technical, human factor in getting benchmarks accepted.</p> +<p>The need for <em>understandability</em> for me means that a database benchmark should consist of a limited number of queries and result metrics. Hence I find TPC-H with its 22 queries more understandable than TPC-DS with its 99, because after (quite some) study and experience it is possible to understand the underlying challnges of all queries in TPC-H. It may also be possible for TPC-DS but the amount of effort is just much larger. Understandable also means for me that a particular query should behave similarly, regardless of the query parameters. Often, a particular query needs to be executed many times, and in order not to play into the hands of simple query caching and also enlarge the access footprint of the workload, different query parameters should be used. However, parameters can strongly change the nature of a query but this is not desirable for the understandability of the workload. For instance, we know that TPC-H Q01 tests raw computation power, as its selection predicate eliminates almost nothing from the main fact table (LINEITEM), that it scans and aggregates into a small 4-tuple result. Using a selection parameter that would select only 0.1% of the data instead, would seriously change the nature of Q01, e.g. making it amendable to indexing. This stability of parameter bindings is an interesting challenge for the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) of LDBC which is not as uniform and uncorrelated as TPC-H. Addressing the challenge of obtaining parameter bindings that have similar execution characteristics will be the topic of a future blog post.</p> +<p>The <em>economical</em> aspect of benchmarking means that while rewarding high-end benchmark runs with higher scores, it is valuable if a meaningful run can also be done with small hardware. For this reason, it is good practice to use a performance-per-EURO (or $) metric, so small installations despite a lower absolute score can still do well on that metric. The economical aspect is right now hurting the (still) leading relational OLTP benchmark TPC-C. Its implementation rules are such that for higher reported rates of throughput, a higher number of warehouses (i.e. larger data size) is needed. In the current day and age of JIT-compiled machinecode SQL procedures and CPU-cache optimized main memory databases, the OLTP throughput numbers now obtainable on modern transactional systems like Hyper on even a single server (it reaches more than 100.000 transactions per second) are so high that they lead to petabyte storage requirements. Not only does this make TPC-C very expensive to run, just by the sheer amount of hardware needed according to the rules, but it also undermines it representativity, since OLTP data sizes encountered in the field are much smaller than OLAP data sizes and do not run in the petabytes.</p> +<p><em>Representative</em> benchmarks can be designed by studying or even directly using real workload information, e.g. 
query logs. A rigorous example of this is the <a href="http://aksw.org/Projects/DBPSB.html">DBpedia benchmark</a> whose workload is based on the query logs of dbpedia.org. However, this SPARQL endpoint is a single public Virtuoso instance that has been configured to interrupt all long running queries, such as to ensure the service remains responsive to as many users as possible. As a result, it is only practical to run small lookup queries on this database service, so the query log only contained solely such light queries. As a consequence, the DBpedia benchmark only tests small SPARQL queries that stress simple B-tree lookups only (and not joins, aggregations, path expressions or inference) and poses almost no technical challenges for either query optimization or execution. The lesson, thus, is to balance representativity with relevance (see later).</p> +<p>The fact that a benchmark can be <em>scaled</em> in size favors the use of synthetic data (i.e. created by a data generator) because data generators can produce any desired quantity of data. I hereby note that in this day and age, data generators should be parallel. Single-threaded single-machine data generation just becomes unbearable even at terabyte scales. A criticism of synthetic data is that it may not be representative of real data, which e.g. tends to contain highly correlated data with skewed distributions. This may be addressed to a certain extent by injecting specific skew and correlations into synthetic data as well (but: which skew and which correlations?). An alternative is to use real data and somehow blow up or contract the data. This is the approach in the mentioned DBpedia benchmark, though such scaling will distort the original distributions and correlations. Scaling a benchmark is very useful to investigate the effect of data size on the metric, on individual queries, or even in micro-benchmark tests that are not part of the official query set. Typically OLTP database benchmarks have queries whose complexity is O(log(N)) of the data size N, whereas OLAP benchmarks have queries which are linear, O(N) or at most O(N.log(N)) &ndash; otherwise executing the benchmark on large instances is infeasible. OLTP queries thus typically touch little data, in the order of log(N) tuples. In order not to measure fully cold query performance, OLTP benchmarks for that reason need a warmup phase with O(N/log(N)) queries in order to get the system into a representative state.</p> +<p>Now, what makes a benchmark <em>relevant</em>? In LDBC we think that benchmarks should be designed such that crucial areas of functionality are highlighted, and in turn system architects are stimulated to innovate. Either to catch up with competitors and bring the performance and functionality in line with the state-of-the-art but even to innovate and address technical challenges for which until now no good solutions exist, but which can give a decisive performance advantage in the benchmark. Inversely stated, benchmark design can thus be a powerful tool to influence the industry, as a benchmark design may set the agendas for multiple commercial design teams and database architects around the globe. To structure this design process, LDBC introduces the notion of <em>&ldquo;choke points&rdquo;</em>: by which we mean problems that challenge current technology. These choke points are collected and described early in the LDBC design process, and the workloads developed later are scored in terms of their coverage of relevant choke points. 
In the case of graph data querying, one of the choke points that is unique to the area is recursive Top-N query handling (e.g. shortest path queries). Another choke point that arises is the impact of correlations between attribute values of graph nodes (e.g. both employed by TUM) and the connectivity degree between nodes (the probability to be friends). The pattern observed in practice is that people who are direct colleagues are often in each other&rsquo;s friend network. A query that selects people in a social graph that work for the same company, and then does a friendship traversal, may get bad intermediate result size estimates and therefore a suboptimal query plan, if optimizers remain unaware of value/structure correlations. So this is an area of functionality that the Social Network Benchmark (SNB) by LDBC will test.</p>
+<p>To illustrate what choke points are in more depth, we wrote a <a href="https://ldbcouncil.org/docs/papers/tpc-h-analyzed-choke-points-tpctc2013.pdf">paper at the TPCTC 2013</a> conference that performs a post-mortem analysis of TPC-H and identifies 28 such choke points. <em><a href="chokepoints.png">This table</a></em> lists them all, grouped into six Choke Point (CP) areas (CP1 Aggregation, CP2 Join, CP3 Locality, CP4 Calculations, CP5 Subqueries and CP6 Parallelism). The classification also shows CP coverage over each of the 22 TPC-H queries (black is high impact, white is no impact).</p>
+<p>I would recommend reading this paper to anyone who is interested in improving the TPC-H score of a relational database system, since this paper contains the collected experience of three database architects who have worked with TPC-H at length: Orri Erling (of Virtuoso), Thomas Neumann (Hyper, RDF-3X), and me (MonetDB, Vectorwise). Recently, Orri Erling showed that this paper is not complete, as he discovered one more choke-point area for TPC-H: Top-N pushdown. In a detailed blog entry, Orri shows how this technique can <a href="http://www.openlinksw.com/weblog/oerling/?id=1779">trivialize Q18</a>; this optimization can single-handedly improve the overall TPC-H score by 10-15%. This is also a lesson for LDBC: even though we design benchmarks with choke points in mind, the queries themselves may bring to light unforeseen opportunities and choke points that may give rise to yet unknown innovations.</p>
+<p>LDBC has just published two benchmarks as Public Drafts, which essentially means that you are cordially invited to download and try out the RDF-focused Semantic Publishing Benchmark <a href="https://ldbcouncil.org/developer/spb">(SPB)</a> and the more graph-focused Social Network Benchmark (<a href="https://ldbcouncil.org/developer/snb">SNB</a>), and <a href="https://groups.google.com/forum/#!forum/ldbcouncil">tell us what you think</a>.
Stay tuned for the coming detailed blog posts about these benchmarks, which will explain the graph and RDF processing choke-points that they test.</p> +<p><em>(for more posts from Peter Boncz, see also <a href="https://databasearchitects.blogspot.com">Database Architects</a>, a blog about data management challenges and techniques written by people who design and implement database systems)</em></p> + + + + + New Website Online LDBC Benchmarks Reach Public Draft + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + <p>The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23 2014, in announcing that two of the benchmarks that it has been developing since 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In case of LDBC, the release is staged: now the benchmark software just runs read-only queries. This will be expanded in a few weeks with a mix of read- and insert-queries. Also, query validation will be added later. Watch this blog for the announcements to come, as this will be a matter of weeks to add.</p> +<p>The Public Draft stage means that the initial software (data generator, query driver) work and an initial technical specification and documentation has been written. In other words, there is a testable version of the benchmark available for anyone who is interested. Public Draft status does not mean that the benchmark has been adopted yet, it rather means that LDBC has come closer to adopting them, but is now soliciting feedback from the users. The benchmarks will remain in this stage at least until October 6. On that date, LDBC is organizing its fifth <a href="https://ldbcouncil.org/event/fifth-tuc-meeting">Technical User Community meeting</a>. One of the themes for that meeting is collecting user feedback on the Public Drafts; which input will be used to either further evolve the benchmarks, or adopt them.</p> +<p>You can also see that we created a this new website and a new logo. This website is different from <code>http://ldbc.eu</code> that describes the EU project which kick-starts LDBC. The ldbcouncil.org is a website maintained by the Linked Data Benchmark Council legal entity, which will live on after the EU project stops (in less than a year). The Linked Data Benchmark Council is an independent, impartial, member-sustained organization dedicated to the creation of RDF and graph data management benchmarks and benchmark practices.</p> +<p>In the next weeks, you will see many contributors in LDBC post items on this blog. Some of these blog entries will be very technical, others not, but all aim to explain what LDBC is doing for RDF and graph benchmarking, and why.</p> + + + + + Social Network Benchmark Goals + https://ldbcouncil.org/post/social-network-benchmark-goals/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/social-network-benchmark-goals/ + <p>Social Network interaction is amongst the most natural and widely spread activities in the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, Social Networks are well understood from the point of view of the data involved and the interaction required by their actors. 
Thus, the concepts of friends of friends, or retweet are well established for the data attributes they represent, and queries such as “find the friend of a specified person who has long worked in a company in a specified country” are natural for the users and easy to understand from a functional point of view.</p> +<p>From a totally different perspective, Social Networks are challenging technologically, being part of the Big Data arena, and require the execution of queries that involve complex relationship search and data traversal computations that turn out to be choke points for the data management solutions in the market.</p> +<p>With the objective of shaping a benchmark which is up to date as a use case, well understood by everybody and poses significant technological challenges, the LDBC consortium decided to create the Social Network Benchmark, <a href="https://ldbcouncil.org/benchmarks/snb">SNB</a>, which is eventually going to include three workloads: the Interactive, the Business Intelligence and the Analytical. Those workloads are going to share a unique synthetic data generation tool that will mimic the data managed by real Social Networks.</p> +<p>The SNB data generator created by LDBC is an evolution of the S3G2 data generator and can be found at the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">LDBC Github repository</a>. The data generator is unique because it generates data that contains realistic distributions and correlations among variables that were not taken into consideration before. It also allows generating large datasets because it uses a Hadoop based implementation to compute the complex data generated. The SNB data generator has already been used in different situations like the <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD programming contest 2014</a>.</p> +<p>The SNB presents the Interactive workload as first of a breed with the objective to resemble the queries that users may place to a Social Network portal. Those are a combination of read and write small queries that express the needs of a user who is interacting with her friends and connections through the Social Network. Queries like that explained above (Q12 in the workload) are examples that set up choke points like pattern recognition or full traversals.</p> +<p>More details will be given in blogs to follow both for the data generator as well as for the specific characteristics of the workloads allowing the users to obtain a first contact with the benchmarks.</p> + + + + + Welcome to the New Industry Oriented LDBC Organisation for Benchmarking RDF and Graph Technologies + https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/ + <p>It is with great pleasure that we announce the new LDBC organisation site at <a href="https://www.ldbcouncil.org">www.ldbcouncil.org</a>. The LDBC started as a European Community FP7 funded project with the objective to create, foster and become an industry reference for benchmarking RDF and Graph technologies. 
A period of more than one and a half years has led us to the creation of the first two workloads, the Semantic Publishing Benchmark and the Social Network Benchmark in its interactive workload, which you will find in the <em>benchmarks</em> menu on this site.</p> +<p>Those benchmarks will allow all the actors in the RDF and Graph industry to know who is who and how the different technology players are reacting to the results of their competing industry companies. Thus, the users will have results to compare the technologies and vendors will have a clear idea of how their products evolve compared to other vendors, all with the objective to foster the technological growth of the RDF and Graph arena.</p> +<p>While the main objective of LDBC is to create benchmarks, we know that we need a strong community to grow and evolve those benchmarks taking into consideration all the market and technology needs. With this objective, we have created a special section to engage all the interested community through a blog, forums to discuss interesting issues and a lot of information on benchmarking, including links to other benchmarks, pointers to interesting conferences and venues and all the publications on benchmarking RDF and Graph technologies.</p> +<p>We want to make sure that we all know what benchmarking and the LDBC effort means, both historically, and from the global needs perspective. To make sure that this is accomplished, we set up a section open to the public with in depth explanations of the history of industry benchmarking, LDBC and why our society needs such efforts globally.</p> +<p>Finally, we want to invite you to our Fifth Technical Users Community (TUC) meeting to be held in Athens next Monday Oct. 6th 2014. This event will have as its main objective to allow for presentations on experiences with the two already released benchmarks, SNB and SPB. You’ll find updated information here.</p> +<p>In all, we expect that the LDBC organisation site engages all of you and that the growth of RDF and Graph technologies in the future is secured by the benchmarks fostered by us.</p> + + + + + 2nd International Workshop on Benchmarking RDF Systems + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + <p>Following the 1st International workshop on Benchmarking RDF Systems (BeRSys 2013) the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industrials can meet to discuss topics related to the performance of RDF systems. BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines - in the line of TPCTC series of workshops.The focus of the workshop is to expose and initiate discussions on best practices, different application needs and scenarios related to different aspects of RDF data management.</p> +<p>More at: <a href="http://events.sti2.at/bersys2014/">http://events.sti2.at/bersys2014/</a></p> + + + + + DATAGEN: Data Generation for the Social Network Benchmark + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + <p>As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective to provide a realistic yet challenging workload, consisting of a social network and a set of queries. 
Both have to be realistic, easy to understand and easy to generate. This post has the objective to discuss the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 <a href="#references">[1]</a>.</p> +<p>One of the most important components of a benchmark is the dataset. However, directly using real data in a benchmark is not always possible. On the one hand, it is difficult to find data with all the scaling characteristics the benchmark requires. On the other hand, collecting real data can be expensive or simply not possible due to privacy concerns.</p> +<p>For these reasons, LDBC-SNB provides DATAGEN which is the synthetic data generator responsible for generating the datasets for the three LDBC-SNB workloads: the Interactive, the Business Intelligence and the Analytical. DATAGEN has been carefully designed with the following goals in mind:</p> +<ul> +<li><strong>Realism.</strong> The data generated by DATAGEN has to mimic the features of those found in a real social network. In DATAGEN, output attributes, cardinalities, correlations and distributions have been finely tuned to reproduce a real social network in each of its aspects. DATAGEN is aware of the data and link distributions found in a real social network such as Facebook <a href="#references">[2]</a>. Also, it uses real data from DBPedia, such as property dictionaries, which ensure that the content is realistic and correlated.</li> +<li><strong>Scalability.</strong> Since LDBC-SNB is targeting systems of different scales and budgets, DBGEN must be capable of generating datasets of different sizes, from a few Gigabytes to Terabytes. DATAGEN is implemented following the MapReduce paradigm, allowing for the generation of large datasets on commodity clusters.</li> +<li><strong>Determinism.</strong> DATAGEN is deterministic regardless of the number of cores/machines used to produce the data. This important feature guarantees that all Test Sponsors will face the same dataset, thus, making the comparisons between different systems fair and the benchmarks’ results reproducible.</li> +<li><strong>Usability.</strong> LDBC-SNB has been designed to have an affordable entry point. As such, DATAGEN has been severely influenced by this philosophy, and therefore it has been designed to be as easy to use as possible.</li> +</ul> +<p>Finally, the area of action of DATAGEN is not only limited to the scope of LDBC-SNB. Several researchers and practitioners are already using DATAGEN in a wide variety of situations. If you are interested on the internals and possibilities of DATAGEN, please visit its official repository (<a href="https://github.com/ldbc/ldbc_snb_datagen)">https://github.com/ldbc/ldbc_snb_datagen)</a>.</p> +<h4 id="references">References</h4> +<p>[1] Pham, Minh-Duc, Peter Boncz, and Orri Erling. &ldquo;S3g2: A scalable structure-correlated social graph generator.&rdquo; Selected Topics in Performance Evaluation and Benchmarking. Springer Berlin Heidelberg, 2013. 156-172.</p> +<p>[2] Prat-Pérez, Arnau, and David Dominguez-Sal. &ldquo;How community-like is the structure of synthetically generated graphs?.&rdquo; Proceedings of Workshop on GRAph Data management Experiences and Systems. 
ACM, 2014.</p> + + + + + Getting Started With SNB + https://ldbcouncil.org/post/getting-started-with-snb/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-snb/ + <p>In a previous blog post titled &ldquo;<a href="https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/">Is SNB like Facebook&rsquo;s LinkBench?</a>&rdquo;, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.</p> +<h3 id="datagen">DATAGEN</h3> +<p>DATAGEN is the data generator used by all the workloads of SNB. <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/">Here</a> we introduced the design goals that drive the development of DATAGEN, which can be summarized as: <em>Realism, Scalability, Determinism and Usability.</em></p> +<p>DATAGEN produces datasets with the following schema, in terms of entities and their relations. Data generated represents a snapshot of the activity of a social network similar to real social networks such as Facebook, during a period of time. Data includes entities such as Persons, Organizations, and Places. The schema also models the way persons interact, by means of the friendship relations established with other persons, and the sharing of content such as messages (both textual and images), replies to messages and likes to messages. People form groups to talk about specific topics, which are represented as tags.</p> +<p><img src="schema.png" alt="image"></p> +<p>For the sake of credibility, data produced by DATAGEN has to be realistic. In this sense, data produced by DATAGEN not only has a realistic schema, but also pays attention to the following items:</p> +<ul> +<li> +<p>Realistic distributions. The degree distribution of friendship relationships has been modeled to reproduce that found in the Facebook graph. Also, other distributions such as the number of replies to a post, the number of persons per country or the popularity of a tag has been realistically modeled either using known distributions or data extracted from real sources such as Dbpedia.</p> +</li> +<li> +<p>Correlated attributes and relations. Attribute values are not chosen at random, but follow correlations. For instance, people from a specific country have a larger probability to have names typical from that country, to work on companies from that country or to study at universities of that country. Also, we DATAGEN implements a relationship creation process that tries to reproduce the homophily principle, that is, people with similar characteristics tend to be connected.</p> +</li> +</ul> +<p>DATAGEN is built on top of Hadoop, to generate datasets of different sizes. It works either on single node SMP machines or a cluster environment. DATAGEN supports different output formats targeting different systems. On the one hand, we have the CSV format, where each entity and relation is output into a different comma separated value file. On the other hand, it also supports the Turtle format for RDF systems.</p> +<p>Finally, DATAGEN outputs two other things:</p> +<ul> +<li> +<p>Update Streams, which will be used in the future to implement updates in the workloads.</p> +</li> +<li> +<p>Substitution parameters, which are the parameters of the query instances the LDBC driver will issue. 
These are selected so that the query plans of the resulting query executions do not differ significantly.</p>
+</li>
+</ul>
+<p>Configuring and using DATAGEN is easy. Please visit <a href="https://github.com/ldbc/ldbc_snb_datagen">this page</a> for more information.</p>
+<h3 id="ldbc-driver">LDBC driver</h3>
+<p>SNB is designed to be as easy to adopt as possible. Therefore, SNB provides the LDBC execution driver, which is designed to automatically generate the benchmark workload and gather the benchmark results. It generates a stream of operations in conformance with a workload definition and executes those operations against some system using the provided database connector, with the substitution parameters produced by DATAGEN. During execution, the driver continuously measures performance metrics, then upon completion it generates a report of those metrics.</p>
+<p>It is capable of generating parallel workloads (e.g. concurrent reads and writes), while respecting the configured operation mix and ensuring that ordering between dependent operations is maintained. For further details on how the driver achieves that, please visit the Documentation <a href="https://github.com/ldbc/ldbc_driver/wiki">page</a>.</p>
+<p>The test sponsor (aka the implementer of the benchmark) has to provide a set of implemented interfaces that form a benchmark implementation to plug into the driver, and then the benchmark is executed automatically.</p>
+<p>Given a workload consisting of a series of <em>Operations</em>, the test sponsor implements <em>OperationHandlers</em> for them. <em>OperationHandlers</em> are responsible for executing instances of a specific operation (query) type. This is done by overriding the method <em>executeOperation</em>(), which receives an <em>Operation</em> instance as its input parameter and returns the result. From the <em>Operation</em> instance, the operation&rsquo;s input parameters can be retrieved, as well as the database connection state.</p>
+<p>The database connector is used to initialize, clean up and get the database connection state. The database connector must implement the <em>Db</em> interface, which consists of three methods: <em>onInit</em>(), <em>onCleanup</em>() and <em>getConnectionState</em>(). <em>onInit</em>() is called before the benchmark is executed, and is responsible for initializing the database and registering the different <em>OperationHandlers</em>. <em>onCleanup</em>() is called after the benchmark has completed. Any resources that need to be released should be released here.</p>
+<p>Finally, <em>getConnectionState</em>() returns an instance of <em>DbConnectionState</em>, which encapsulates any state that needs to be shared between <em>OperationHandler</em> instances. For instance, this state could contain the necessary classes used to execute a given query for the implementing system.</p>
+<p>A good example of how to implement the benchmark can be found <a href="https://github.com/ldbc/ldbc_driver/wiki/Implementing%20a%20Database%20Connector">here</a>.</p>
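+<p><em>Note: the sketch below is only meant to make the pieces above concrete. It follows the interfaces described in this post (Db, DbConnectionState, OperationHandler), but the exact signatures may differ between driver releases, and MyGraphClient and runQuery1 are hypothetical stand-ins for the client of the system under test.</em></p>
+<pre><code class="language-java">
+// Schematic sketch only; not tied to a specific ldbc_driver release.
+public class MyDb extends Db {
+
+    /** State shared by all OperationHandler instances, e.g. an open client connection. */
+    public static class MyConnectionState extends DbConnectionState {
+        final MyGraphClient client;   // hypothetical client of the system under test
+        MyConnectionState(String url) { this.client = MyGraphClient.connect(url); }
+    }
+
+    private MyConnectionState state;
+
+    @Override
+    protected void onInit(Map&lt;String, String> properties) {
+        // Called once before the benchmark starts: open the connection and
+        // register one OperationHandler per operation (query) type.
+        state = new MyConnectionState(properties.get("url"));
+        registerOperationHandler(LdbcQuery1.class, Query1Handler.class);
+    }
+
+    @Override
+    protected void onCleanup() {
+        state.client.close();         // release resources after the run completes
+    }
+
+    @Override
+    protected DbConnectionState getConnectionState() {
+        return state;                 // handed to the handlers during execution
+    }
+
+    /** Executes instances of one specific operation type. */
+    public static class Query1Handler extends OperationHandler&lt;LdbcQuery1> {
+        @Override
+        protected OperationResult executeOperation(LdbcQuery1 operation) {
+            MyConnectionState s = (MyConnectionState) dbConnectionState();
+            // Run the query with the operation's substitution parameters and
+            // wrap the rows into the driver's result type.
+            return operation.buildResult(0, s.client.runQuery1(operation));
+        }
+    }
+}
+</code></pre>
+<p><em>The point of the split is that the driver owns scheduling and measurement, while the connector only translates operations into calls against the system under test.</em></p>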
+<h3 id="workloads">Workloads</h3>
+<p>Currently, LDBC has only released the first draft of the Interactive workload, but the business intelligence and analytical workloads are in the works. Workloads are designed to mimic the different usage scenarios found in operating a real social network site, and each of them targets one or more types of systems. Each workload defines a set of queries and query mixes, designed to stress the systems under test in different choke-point areas, while being credible and realistic.</p>
+<p>The Interactive workload reproduces the interaction between the users of the social network by including lookups and transactions that update small portions of the database. These queries are designed to be interactive and target systems capable of responding to such queries with low latency for multiple concurrent users. Examples of Interactive queries are retrieving, for a given user, those friends with a specific name, or finding the most recent posts and comments created by your friends.</p>
+<p>The Business Intelligence workload will represent those business intelligence analytics a social network company would like to perform on the social network, in order to take advantage of the data to discover new business opportunities. This workload will explore moderate portions of the data from different entities, and will perform more complex and data-intensive operations compared to the Interactive ones.</p>
+<p>Examples of possible Business Intelligence queries could be finding trending topics in a country at a given moment, or looking for fraudulent “likers”.</p>
+<p>Finally, the Analytical workload will aim at exploring the characteristics of the underlying structure of the network. Shortest paths, community detection or centrality are representative queries of this workload, and will imply touching a vast portion of the dataset.</p>
+<h3 id="final-remarks">Final remarks</h3>
+<p>This is just a quick overview of the SNB benchmark. For a more detailed description, do not hesitate to read the official SNB specification <a href="https://github.com/ldbc/ldbc_snb_docs">draft</a>, and stay tuned to the LDBC blog for future blog posts detailing all of the SNB parts in depth.</p>
+ + + + + Introducing SNB Interactive, the LDBC Social Network Benchmark Online Workload + https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/ + <p>The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads: interactive, business intelligence and graph analytics. This post introduces the interactive workload.</p>
+<p>The benchmark measures the speed of queries of medium complexity against a social network being constantly updated. The queries are scoped to a user&rsquo;s social environment and potentially access data associated with the friends of a user and their friends.</p>
+<p>This is representative of an operational application. This goes beyond OLTP (On Line Transaction Processing) by having substantially more complex queries touching much more data than the point lookups and short reports in TPC-C or TPC-E. The emphasis is on presenting a rich and timely view of a constantly changing environment.</p>
+<p>SNB Interactive gives end users and application developers a reference workload for comparing the relative merits of different technologies for graph data management. These range from dedicated graph databases to RDF stores and relational databases. There are graph serving benchmarks such as Facebook&rsquo;s LinkBench, but SNB Interactive goes well beyond this in richness of schema and queries.</p>
+<p>The challenge to implementors is handling the user-facing logic of a social network in a single system as the scale increases.
The present practice in large social networks is massive sharding and use of different SQL and key-value stores for different aspects of the service. The SNB workload is not intended to replicate this situation but to look for ways forward, so that one system can keep up with transactions and offer users rich and varied insight into their environment. The present practice relies on massive precomputation, but SNB Interactive seeks more agility and ad hoc capability also on the operational side.</p>
+<p>The dataset is scaled in buckets, with distinct scales for 10, 30, 100, 300GB and so forth. A 100GB dataset has approximately 500,000 simulated users with their connections and online history. This is a convenient low-end single-server size, while 500 million users is 100TB, which is a data center scale requiring significant scale-out.</p>
+<p>The metric is operations per minute at scale. Online benchmarks typically have a fixed ratio between throughput and dataset size. Here we depart from this, so one can report arbitrarily high throughputs at any scale. This makes main-memory approaches feasible, which corresponds to present online practices. The benchmark makes transactions and queries on a simulated timeline of social interactions. The challenge for the system is to run this as fast as possible at the selected scale while providing fast and predictable response times. Throughput can be increased at the cost of latency, but here the system must satisfy response time criteria while running at the reported throughput.</p>
+<p>Different technologies can be used for implementing SNB Interactive. The workload is defined in natural language with sample implementations in SPARQL and Cypher. Other possibilities include SQL and graph database APIs.</p>
+<p>SNB Interactive is an example of LDBC&rsquo;s choke-point-driven design methodology, where we draw on the combined knowledge and experience of several database system architects for defining realistic, yet ambitious challenges whose solution will advance the state of the art.</p>
+<p>The benchmark specification and associated tools are now offered for public feedback. The LDBC partners working on SNB Interactive will provide sample implementations of the workload on their systems, including Virtuoso, Neo4j and Sparsity. Specifics of availability and coverage may vary.</p>
+<p>Subsequent posts will address the workload in more detail.</p>
+ + + + + Is SNB Like Facebooks LinkBench + https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/ + <p>In this post, I will discuss in some detail the rationale and goals of the design of the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) and explain how it relates to real social network data as in Facebook, and in particular Facebook&rsquo;s own graph benchmark called <a href="https://www.facebook.com/notes/facebook-engineering/linkbench-a-database-benchmark-for-the-social-graph/10151391496443920">LinkBench</a>. We think SNB is the most intricate graph database benchmark to date (it&rsquo;s also available in RDF!), and it has already made some waves.
SNB recently received praise at the most important database systems conference <a href="http://www.sigmod2014.org/">SIGMOD in Snowbird</a> after being used for this year&rsquo;s <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD Programming Contest</a>, which was about graph analytics.</p> +<p>SNB is intended to provide the following <strong>value</strong> to different stakeholders:</p> +<ul> +<li> +<p>For end users facing graph processing tasks, SNB provides a recognizable scenario against which it is possible to <em>compare merits of different products</em> and technologies. By covering a wide variety of scales and price points, SNB can serve as an aid to technology selection.</p> +</li> +<li> +<p>For vendors of graph database technology, SNB provides a <em>checklist of features</em> and performance characteristics that helps in product positioning and can serve to guide new development.</p> +</li> +<li> +<p>For researchers, both industrial and academic, the SNB dataset and workload provide <em>interesting challenges</em> in multiple technical areas, such as query optimization, (distributed) graph analysis, transactional throughput, and provides a way to objectively compare the effectiveness and efficiency of new and existing technology in these areas.</p> +</li> +</ul> +<p>I should clarify that even though the data model of SNB resembles Facebook (and we&rsquo;re extending it to also look more like Twitter), the goal of SNB is not to advise Facebook or Twitter what systems to use, they don&rsquo;t need LDBC for that. Rather, we take social network data as a model for the much more broader graph data management problems that IT practitioners face. The particular characteristic of a graph data management problem is that the queries and analysis is not just about finding data by value, but about learning about the <em>connection patterns</em> between data. The scenario of the SNB, a social network, was chosen with the following goals in mind:</p> +<ul> +<li> +<p>the benchmark scenario should be <strong>understandable</strong> to a large audience, and this audience should also understand the relevance of managing such data.</p> +</li> +<li> +<p>the scenario in the benchmark should cover the complete range of challenges <strong>relevant</strong> for graph data management, according to the benchmark scope.</p> +</li> +<li> +<p>the query challenges in it should be <strong>realistic</strong> in the sense that, though synthetic, similar data and workloads are encountered in practice.</p> +</li> +</ul> +<p>The SNB is in fact three distinct benchmarks with a common dataset, since there are <em>three different workloads</em>. Each workload produces a single metric for performance at the given scale and a price/performance metric at the scale. The full disclosure further breaks down the composition of the metric into its constituent parts, e.g. single query execution times.</p> +<ul> +<li> +<p><strong>Interactive Workload.</strong> The Interactive SNB workload is the first one we are releasing. It is defined in plain text, yet we have example implementations in Neo4j&rsquo;s Cypher, SPARQL and SQL. The interactive workloads tests a system&rsquo;s throughput with relatively simple queries with concurrent updates. The system under test (SUT) is expected to run in a steady state, providing durable storage with smooth response times. Inserts are typically small, affecting a few nodes at a time, e.g. uploading of a post and its tags. Transactions may require serializability, e.g. 
verifying that something does not exist before committing the transaction. Reads do not typically require more than read committed isolation. One could call the Interactive Workload an OLTP workload, but while queries typically touch a small fraction of the database, this can still be up to hundreds of thousands of values (the two-step neighborhood of a person in the social graph, often). Note that in order to support the read-queries, there is a lot of liberty to create indexing structures or materialized views, however such structures need to be maintained with regards to the continues inserts that also part of the workload. This workload is now in draft stage, which means that the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a> and <a href="https://github.com/ldbc/ldbc_driver">driver software stack</a> are ready and the purpose is to obtain user feedback, as well as develop good system implementations. The first implementations of this workload are now running on Openlink Virtuoso, Neo4j and Sparsity Sparksee, and we are eager to see people try these, and optimize and involve these.</p> +</li> +<li> +<p><strong>Business Intelligence Workload.</strong> There is a first stab at this workload formulated in SPARQL, tested against Openlink Virtuoso. The BI workload consists of complex structured queries for analyzing online behavior of users for marketing purposes. The workload stresses query execution and optimization. Queries typically touch a large fraction of the data and do not require repeatable read. The queries will be concurrent with trickle load (not out yet). Unlike the interactive workload, the queries touch more data as the database grows.</p> +</li> +<li> +<p><strong>Graph Analytics Workload.</strong> This workload is not yet available. It will test the functionality and scalability of the SUT for graph analytics that typically cannot be expressed in a query language. As such it is the natural domain for graph programming frameworks like Giraph. The workload is still under development, but will consist of algorithms like PageRank, Clustering and Breadth First Search. The analytics is done on most of the data in the graph as a single operation. The analysis itself produces large intermediate results. The analysis is not expected to be transactional or to have isolation from possible concurrent updates.</p> +</li> +</ul> +<p>All the SNB scenarios share a common scalable synthetic data set, generated by a state-of-the art <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a>. We strongly believe in a single dataset that makes sense for all workloads, that is, the interactive and BI workloads will traverse data that has sensible PageRank outcomes, and graph clustering structure, etc. This is in contrast to <a href="http://people.cs.uchicago.edu/~tga/pubs/sigmod-linkbench-2013.pdf">LinkBench</a>, released by the team of Facebook that manages the OLTP workload on the Facebook Graph, which closely tunes to the <strong>low-level</strong> MySQL query patterns Facebook sees, but whose graph structure does not attempt to be realistic beyond average out degree of the nodes (so, it makes no attempts to create realistic community patterns or correlations) . 
The authors of LinkBench may be right that the graph structure does not make a difference for simple insert/update/delete/lookup actions which LinkBench itself tests, but for the SNB queries in the Interactive and BI workloads this is not true. Note that <a href="http://borthakur.com/ftp/sigmod2013.pdf">Facebook&rsquo;s IT infrastructure</a> does not store all user data in MySQL and its modified memcached (&quot;<a href="http://www.cs.cmu.edu/~pavlo/courses/fall2013/static/papers/11730-atc13-bronson.pdf">TAO</a>&quot;), some of it ends up in separate subsystems (using HDFS and HBase), which is outside of the scope of LinkBench. However, for queries like in the SNB Interactive and BI workloads it <strong>does</strong> matter how people are connected, and how the attribute values of connected people correlate. In fact, the SNB data generator is unique in that it generates a huge graph with <em>correlations</em>, where people who live together, have the same interests or work for the same company have greater chance to be connected, and people from Germany have mostly German names, etc. Correlations frequently occur in practice and can strongly influence the quality of query optimization and execution, therefore LDBC wants to test their effects on graph data management systems (the impact of correlation among values and structure on query optimization and execution are a &ldquo;choke point&rdquo; for graph data management system where LDBC wants to stimulate innovation).</p> + + + + + Making It Interactive + https://ldbcouncil.org/post/making-it-interactive/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-it-interactive/ + <p><em>Synopsis:</em> Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must be both credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation for what online systems in fact do. So, the workload mix must strike a balance between the practice and presenting new challenges.</p> +<p>It is about to be showtime for LDBC. The initial installment of the LDBC Social Network Benchmark (SNB) is the full data generator, test driver, workload and reference implementation for the interactive workload. SNB will further acquire business intelligence and graph analytics workloads but this post is about the interactive workload.</p> +<p>As part of finalizing the interactive workload, we need to determine precise mixes of the component queries and updates. We note that the interactive mix so far consists of very heavy queries. These touch, depending on the scale upwards of a million entities in the database.</p> +<p>Now, rendering a page view in a social network site does not touch millions of entities. The query that needs to be correct and up to date touches tens or hundreds of entities, e.g. posts or social connections for a single page impression. 
There are also statistical views, like the count of people within so many steps or contact recommendations, but these are not real-time and are not recalculated each time they are shown.</p>
+<p>So, LDBC SNB has a twofold task:</p>
+<ol>
+<li>In order to be a credible interactive workload, it must in fact have the characteristics of one.</li>
+<li>In order to stimulate progress, it must have queries that are harder than those that go into routine page views but are still not database-wide analytics.</li>
+</ol>
+<p>Designing a workload presents specific challenges:</p>
+<ol>
+<li>The workload must be realistic enough for users to identify with it.</li>
+<li>The workload must pose challenges and drive innovation in a useful direction.</li>
+<li>The component operations must all play a noticeable role in it. If the operation&rsquo;s relative performance does not affect the score, why is it in the workload?</li>
+</ol>
+<p>The interactive mix now has 14 queries that are interesting from a query optimization and execution viewpoint but touch millions of entities. This is not what drives page impressions in online sites. Many users of graph database and RDF systems are running online sites, so this aspect must not be ignored.</p>
+<p>Very roughly, the choke points (technical challenges) of SNB Interactive are as follows:</p>
+<ul>
+<li>Random access - Traversing between people and content makes large numbers of random lookups. These can be variously parallelized and/or vectored.</li>
+<li>Query optimization must produce the right plans - The primary point is join order and join type. Index-based vs. hash-based joins have very different performance properties and the right choice depends on correctly guessing the number of rows and of distinct keys on either side of the join.</li>
+<li>When doing updates and lookups, the execution plan is obvious, but there the choke point is the scheduling of large numbers of short operations.</li>
+<li>Many queries have aggregation, many have distinct, all have result ordering and a limit on result count. The diverse interactions of these operators produce optimization opportunities.</li>
+</ul>
+<p>Dreaming up a scenario and workload is not enough for a benchmark. There must also be a strong indication that the job is doable and plausible in the scenario.</p>
+<p>In online benchmarks, different operations have different frequencies and the operations are repeated large numbers of times. There is a notion of steady state, so that the reported result represents a level of performance a system can sustain indefinitely.</p>
+<p>A key part of the workload definition is the workload mix, i.e. the relative frequencies of the operations. This in fact decides what the benchmark measures.</p>
+<p>The other aspect is the metric, typically some variation on operations per unit of time.</p>
+<p>All these are interrelated. Here we can take clicks per second as a metric, which is easy to understand. We wish to avoid the pitfall of TPC-C, which ties the metric to a data size, so that for a high metric one must have a correspondingly larger database. This rule makes memory-only implementations unworkable in practice, while in reality many online systems in fact run from memory. So, here we scale in buckets, like in TPC-H, but we still have an online workload. The scenario of the benchmark has its own timeline, here called simulation time. A benchmark run produces events in the simulation time but takes place in real time. This defines an acceleration ratio. For example, we could say that a system does 1000 operations per second at 300G scale, with an acceleration of 7x, i.e. 7 hours worth of simulation time are done in one hour of real time. A metric of this form is directly understandable for sizing a system, as long as the workload mix is realistic. We note that online sites are usually provisioned so that servers do not run anywhere near their peak throughput at a busy time.</p>
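+<p><em>Note: the following few lines merely restate the bookkeeping above in code, using the example figures from this paragraph; they are not measured results.</em></p>
+<pre><code class="language-java">
+// Back-of-the-envelope check of the simulation-time bookkeeping (example figures only).
+public class AccelerationCheck {
+    public static void main(String[] args) {
+        double wallClockSeconds = 3600;    // one hour of real benchmark time
+        double throughputPerSec = 1000;    // measured operations per second
+        double acceleration     = 7.0;     // simulation time divided by real time
+
+        double simulationHours = acceleration * wallClockSeconds / 3600.0;  // 7 hours covered
+        double opsPerMinute    = throughputPerSec * 60;                     // metric of the run
+        System.out.printf("covers %.1f hours of simulation time at %.0f ops/minute%n",
+                          simulationHours, opsPerMinute);
+    }
+}
+</code></pre>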
+<p>So how to define the actual mix? By measuring. But measuring requires a reference implementation that is generally up to date for the database science of the time and where the individual workload pieces are implemented in a reasonable manner, so no bad query plans or bad schema design. For the reference implementation, we use the Virtuoso column store in SQL.</p>
+<p>But SQL is not graphy! Why not SPARQL? Because SPARQL has diverse fixed overheads and this is not an RDF-only workload. We do not want SPARQL overheads to bias the metric; we just want an implementation where we know exactly what goes on and how it works, with control of physical data placement so we know there are no obvious stupidities in any of this. SPARQL will come. Anyway, as said elsewhere, we believe that SPARQL will outgrow its overheads, at which point SQL or SPARQL is a matter of esthetic preference. For now, it is SQL and all we want is transparency into the metal.</p>
+<p>Having this, we peg the operation mix to the update stream generated by the data generator. At the 30G scale, there are 3.5M new posts/replies per month of simulation time. For each such update, a query mix will be run, so as to establish a realistic read/write ratio. The query mix will have fractional queries, for example 0.2 friend recommendations per new post, but that is not a problem, since we run large numbers of these and at the end of the run can check that the ratios of counts are as expected. Next, we run this as fast as it will go on the test system. Then we adjust the ratio of short and long queries to meet the following objectives:</p>
+<ul>
+<li>Short queries should collectively be about 45% of the CPU load.</li>
+<li>Updates will be under 5%.</li>
+<li>Long queries will take up the rest. For long queries, we further tune the relative frequencies so that each represents a roughly equal slice of the time. Having a query that does not influence the metric is useless, so each gets enough showtime to have an impact, but by their nature some are longer than others.</li>
+</ul>
+<p>The reason why short queries should have a large slice is that this is so in real interactive systems. The reason why long queries are important is that they drive innovation. Like this we get both scheduling (short lookup/update) and optimization choke points covered. As a bonus, we make the mix so that we get a high metric, i.e. many clicks per second, since this is what the operator of an online site wants. (A small sketch of this calibration arithmetic is given below.)</p>
+<p>There is a further catch: different scales have different degrees in the friendship graph, and this will have a different influence on different queries. To see whether this twists the metric out of shape we must experiment. For example, one must not have logarithmic and linear complexity queries in the same mix, as BSBM for example has. So this is to be kept in mind as we proceed.</p>
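+<p><em>Note: the sketch below only illustrates the shape of the calibration described above; the query names and costs are invented. The idea is to measure the per-execution CPU cost of each long query, reserve roughly 45% of the per-update budget for short reads and under 5% for updates, and split the remainder evenly, which yields the (possibly fractional) per-update frequencies mentioned above.</em></p>
+<pre><code class="language-java">
+// Illustrative calibration sketch; all numbers are invented.
+public class MixCalibration {
+    public static void main(String[] args) {
+        String[] longQueries = {"Q3", "Q5", "Q9"};       // hypothetical long read queries
+        double[] costMs      = {120.0, 450.0, 900.0};    // measured CPU cost per execution
+
+        double budgetMsPerUpdate = 100.0;  // total CPU budget spent per new post/reply
+        double shortShare  = 0.45;         // short lookups: about 45% of the CPU load
+        double updateShare = 0.05;         // inserts/updates: under 5%
+        double longShare   = 1.0 - shortShare - updateShare;
+
+        // Give each long query a roughly equal slice of time, then express that slice
+        // as a (possibly fractional) number of executions per update in the stream.
+        double perQueryBudget = longShare * budgetMsPerUpdate / longQueries.length;
+        for (int i = 0; i &lt; longQueries.length; i++) {
+            System.out.printf("%s: %.3f executions per update%n",
+                              longQueries[i], perQueryBudget / costMs[i]);
+        }
+    }
+}
+</code></pre>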
+<p>In the next post we will look at the actual mix and execution times on the test system.</p>
+ + + + + SNB Data Generator - Getting Started + https://ldbcouncil.org/post/snb-data-generator-getting-started/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-data-generator-getting-started/ + <p>In previous posts (<a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">this</a> and <a href="https://ldbcouncil.org/post/getting-started-with-snb">this</a>) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datasets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.</p>
+<h3 id="getting-and-configuring-hadoop">Getting and Configuring Hadoop</h3>
+<p>DATAGEN runs on top of Hadoop 1.2.1 in order to scale. You can download it from here. Open a console and type the following commands to decompress Hadoop into the /home/user folder:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user
+</span></span><span style="display:flex;"><span>$ tar xvfz hadoop-1.2.1.tar.gz
+</span></span></code></pre></div><p>For simplicity, in this tutorial we will run DATAGEN in standalone mode, that is, only one machine will be used, using only one thread at a time to run the mappers and reducers. This is the default configuration, and therefore nothing else needs to be done to configure it. For other configurations, such as Pseudo-Distributed (multiple threads on a single node) or Distributed (a cluster of machines), visit the <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/wiki/Configuration">LDBC DATAGEN wiki</a>.</p>
+<h3 id="getting-and-configuring-datagen">Getting and configuring DATAGEN</h3>
+<p>Before downloading DATAGEN, be sure to fulfill the following requirements:</p>
+<ul>
+<li>Linux-based machine</li>
+<li>Java 1.6 or greater</li>
+<li>Python 2.7.x</li>
+<li>Maven 3</li>
+</ul>
+<p>After configuring Hadoop, it is time to get DATAGEN from the official LDBC-SNB repositories. Always download the latest release, which at this time is v0.1.2. The releases page can be found <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/releases">here</a>. Again, decompress the downloaded file with the following commands:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user
+</span></span><span style="display:flex;"><span>$ tar xvfz ldbc_snb_datagen-0.1.2.tar.gz
+</span></span></code></pre></div><p>This will create a folder called “ldbc_snb_datagen-0.1.2”.</p>
+<p>DATAGEN provides <em>run.sh</em>, a script to automate the compilation and execution of DATAGEN.
It needs to be configured for your environment, so open it and set the two variables at the top of the script to the corresponding paths.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>HADOOP_HOME<span style="color:#f92672">=</span>/home/user/hadoop-1.2.1 +</span></span><span style="display:flex;"><span>LDBC_SNB_DATAGEN_HOME<span style="color:#f92672">=</span>/home/user/ldbc_snb_datagen +</span></span></code></pre></div><p>HADOOP_HOME points to the path where hadoop-1.2.1 is installed, while LDBC_SNB_DATAGEN_HOME points to where DATAGEN is installed. Change these variables to the appropriate values. Now, we can execute <em>run.sh</em> script to compile and execute DATAGEN using default parameters. Type the following commands:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user/ldbc_snb_datagen-0.1.2 +</span></span><span style="display:flex;"><span>$ ./run.sh +</span></span></code></pre></div><p>This will run DATAGEN, and two folders will be created at the same directory: <em>social_network</em> containing the scale factor 1 dataset with csv uncompressed files, and <em>substitution_parameters</em> containing the substituion parameters needed by the driver to execute the benchmark.</p> +<h3 id="changing-the-generated-dataset">Changing the generated dataset</h3> +<p>The characteristics of the dataset to be generated are specified in the <em>params.ini</em> file. By default, this file has the following content:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:1</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:1</span> +</span></span></code></pre></div><p>The following is the list of options and their default values supported by DATAGEN:</p> +<table> +<thead> +<tr> +<th>Option</th> +<th>Default value</th> +<th>Description</th> +</tr> +</thead> +<tbody> +<tr> +<td>scaleFactor</td> +<td>1</td> +<td>&ldquo;The scale factor of the data to generate. Possible values are: 1, 3, 10, 30, 100, 300 and 1000&rdquo;</td> +</tr> +<tr> +<td>serializer</td> +<td>csv</td> +<td>&ldquo;The format of the output data. Options are: csv, csv_merge_foreign, ttl&rdquo;</td> +</tr> +<tr> +<td>compressed</td> +<td>FALSE</td> +<td>Specifies to compress the output data in gzip.</td> +</tr> +<tr> +<td>outputDir</td> +<td>./</td> +<td>Specifies the folder to output the data.</td> +</tr> +<tr> +<td>updateStreams</td> +<td>FALSE</td> +<td>&ldquo;Specifies to generate the update streams of the network. If set to false, then the update portion of the network is output as static&rdquo;</td> +</tr> +<tr> +<td>numThreads</td> +<td>1</td> +<td>Sets the number of threads to use. 
Only works for pseudo-distributed mode</td> +</tr> +</tbody> +</table> +<p>For instance, a possible <em>params.ini</em> file could be the following:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:30</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:ttl</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:true</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span> +</span></span></code></pre></div><p>For those not interested on generating a dataset for a given predefined scale factor, but for other applications, the following parameters can be specified (they need to be specified all together):</p> +<table> +<thead> +<tr> +<th>Option</th> +<th>Default value</th> +<th>Description</th> +</tr> +</thead> +<tbody> +<tr> +<td>numPersons</td> +<td>-</td> +<td>The number of persons to generate</td> +</tr> +<tr> +<td>numYears</td> +<td>-</td> +<td>The amount of years of activity</td> +</tr> +<tr> +<td>startYear</td> +<td>-</td> +<td>The start year of simulation.</td> +</tr> +</tbody> +</table> +<p>The following is an example of another possible <em>params.ini</em> file</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">numPersons:100000</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numYears:3</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">startYear:2010</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv_merge_foreign</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:true</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span> +</span></span></code></pre></div><p>For more information about the schema of the generated data, the different scale factors and serializers, please visit the wiki page of DATAGEN at <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/">GitHub</a>!</p> + + + + + The Day of Graph Analytics + https://ldbcouncil.org/post/the-day-of-graph-analytics/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/the-day-of-graph-analytics/ + <p><em>Note: consider this post as a continuation of the &ldquo;<a href="https://ldbcouncil.org/post/making-it-interactive">Making it interactive</a>&rdquo; post by Orri Erling.</em></p> +<p>I have now completed the <a href="https://github.com/openlink/virtuoso-opensource">Virtuoso</a> TPC-H work, including scale out. Optimization possibilities extend to infinity but the present level is good enough. 
<a href="http://www.tpc.org/tpch/">TPC-H</a> is the classic of all analytics benchmarks and is difficult enough, I have extensive commentary on this on my blog (In Hoc Signo Vinces series), including experimental results. This is, as it were, the cornerstone of the true science. This is however not the totality of it. From the LDBC angle, we might liken this to the last camp before attempting a mountain peak.</p> +<p>So, we may now seriously turn to graph analytics. The project has enough left to run in order to get a good BI and graph analytics workload. In LDBC in general, as in the following, BI or business intelligence means complex analytical queries. Graph analytics means graph algorithms that are typically done in graph programming frameworks or libraries.</p> +<p>The BI part is like TPC-H, except for adding the following challenges:</p> +<ul> +<li> +<p>Joins of derived tables with group by, e.g. comparing popularity of items on consecutive time periods.</p> +</li> +<li> +<p>Transitive dimensions - A geographical or tag hierarchy can be seen as a dimension table. To get the star schema plan with the selective hash join, the count of the transitive traversal of the hierarchy (hash build side) must be correctly guessed.</p> +</li> +<li> +<p>Transitivity in fact table, i.e. average length of reply thread. There the cost model must figure that the reply link is much too high cardinality for hash build side, besides a transitive operation is not a good candidate for a build in multiple passes, hence the plan will have to be by index.</p> +</li> +<li> +<p>Graph traversal with condition on end point and navigation step. The hierarchical dimensions and reply threads are in fact trees, the social graph is not. Again the system must know some properties of connectedness (in/out degree, count of vertices) to guess a traversal fanout. This dictates the join type in the step (hash or index). An example is a transitive closure with steps satisfying a condition, e.g. all connected persons have a specific clearance.</p> +</li> +<li> +<p>Running one query with parameters from different buckets, implying different best plan.</p> +</li> +<li> +<p>Data correlations, e.g. high selectivity arising from two interests seldom occurring together, in places where the correct estimation makes the difference between a good and a bad plan.</p> +</li> +<li> +<p>Large intermediate results stored in tables, as in materializing complex summaries of data for use in follow up queries.</p> +</li> +<li> +<p>More unions and outer joins.</p> +</li> +</ul> +<p>The idea is to cover the base competences the world has come to expect and to build in challenges to last another 10-15 years.</p> +<p>For rules and metric, we can use the TPC-H or <a href="http://www.tpc.org/tpcds/default.asp">TPC-DS</a> ones as a template. The schema may differ from an implementation of the interactive workload, as these things would normally run on different systems anyway. As another activity that is not directly LDBC, I will do a merge of SNB and <a href="http://www.openstreetmap.org/">Open Street Map</a>. The geolocated things (persons, posts) will get real coordinates from their vicinity and diverse geo analytics will become possible. This is of some significant interest to Geoknow, another FP7 where OpenLink is participating.</p> +<p>Doing the BI mix and even optimizing the interactive part involves some redoing of the present support for transitivity in Virtuoso. 
The partitioned group by with some custom aggregates is the right tool for the job, with all parallelization, scale-out, etc ready. You see, TPC-H is very useful also in places one does not immediately associate with it.</p> +<p>As a matter of fact, this becomes a BSP (bulk synchronous processing) control structure. Run any number of steps, each item produces results/effects scattered across partitions. The output of the previous is the input of the next. We might say BSP is an attractor or &ldquo;Platonic&rdquo; control structure to which certain paths inevitably lead. Last year I did a BSP implementation in SQL, reading and writing tables and using transactions for serializable update of the border. This is possible but will not compete with a memory based framework and not enough of the optimization potential, e.g. message combining, is visible to the engine in this formulation. So, now we will get this right, as suggested.</p> +<p>So, the transitive derived table construct can have pluggable aggregations, e.g. remembering a path, a minimum length or such), reduction like a scalar-valued aggregate (min/max), different grouping sets like in a group by with cube or grouping sets, some group-by like reduction for message combining and so forth. If there is a gather phase that is not just the result of the scatter of the previous step, this can be expressed as an arbitrary database query, also cross partition in a scale-out setting.</p> +<p>The distributed/partitioned group by hash table will be a first class citizen, like a procedure scoped temporary table to facilitate returning multiple results and passing large data between multiple steps with different vertex operations, e.g. forward and backward in betweenness centrality.</p> +<p>This brings us to the graph analytics proper, which is often done in BSP style, e.g. <a href="http://es.slideshare.net/shatteredNirvana/pregel-a-system-for-largescale-graph-processing">Pregel</a>, <a href="http://giraph.apache.org">Giraph</a>, <a href="http://uzh.github.io/signal-collect/">Signal-Collect</a>, some but not all <a href="http://ppl.stanford.edu/main/green_marl.html">Green-Marl</a> applications. In fact, a Green-Marl back end for Virtuoso is conceivable, whether one will be made is a different matter.</p> +<p>With BSP in the database engine, a reference implementation of many standard algorithms is readily feasible and performant enough to do reasonable sizing for the workload and to have a metric. This could be edges or vertices per unit of time, across a mix of algorithms, for example. Some experimentation will be needed. The algorithms themselves may be had from the Green-Marl sample programs or other implementations. Among others, Oracle would presumably agree that this sort of functionality will in time migrate into core database. We will here have a go at this and along the way formulate some benchmark tasks for a graph analytics workload. Whenever feasible, this will derive from existing work such as <a href="http://graphbench.org/">graphbench.org</a> but will be adapted to the SNB dataset.</p> +<p>The analytics part will be done with more community outreach than the interactive one. I will blog about the business questions, queries and choke points as we go through them. 
The interested may pitch in as the matter comes up.</p> + + + + + Using LDBC SPB to Find OWLIM Performance Issues + https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/ + Wed, 20 Aug 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/ + <p>During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (LDBC-SPB) as a part of our development and release process.</p> +<p>The first thing we’ve started using the LDBC-SPB for is to monitor the performance of our RDF Store when a new release is about to come out.</p> +<p>Initially, we decided to fix some of the benchmark parameters:</p> +<ul> +<li>the dataset size: 50 million triples (LDBC-SPB50)</li> +<li>benchmark warmup and benchmark run times: 60s and 600s, respectively</li> +<li>maximum number of Editorial Agents (E): 2 (threads that will execute INSERT/UPDATE operations)</li> +<li>maximum number of Aggregation Agents (A): 16 (threads that will execute SELECT operations)</li> +<li>data generated by the benchmark driver to be “freshly” deployed before each benchmark run - the benchmark driver can be configured to generate the data and stop. We’re using that option and have a fresh copy of the data put aside, ready for each run.</li> +</ul> +<p>Having those parameters fixed, running LDBC-SPB is a straightforward task. The hardware we’re using for benchmarking is a machine with 2 Intel Xeon CPUs, 8 cores each, 256 GB of memory and SSD storage, running Linux. Another piece of hardware we’ve tested with is a regular desktop machine with an Intel i7, 32 GB of memory and HDD storage. During our experiments we have allowed a deviation in results of 5% to 10% because of the multi-threaded nature of the benchmark driver.</p> +<p>We’ve also decided to produce some benchmark results on Amazon’s EC2 instances and compare them with the results we’ve had so far. Starting with an m3.2xlarge instance (8 vCPUs, 30GB of memory and 2x80GB SSD storage) on a 50M dataset, we achieved more than 50% lower results than those on our own hardware. On a larger Amazon instance, c3.4xlarge (16 vCPUs, 30GB of memory and doubled SSD storage), we achieved the same performance in terms of aggregation operations and even worse performance in terms of editorial operations, which we attribute to the fact that Amazon instances do not provide consistent performance all the time.</p> +<p>The following two charts show how OWLIM performs on different hardware and with different configurations. They also give an indication of Amazon’s capabilities compared to the results achieved on bare-metal hardware.</p> +<p><img src="16-2-Performance.png" alt="image"></p> +<p>Figure 1: OWLIM performance on 2 Amazon instances and 2 local machines, with 16 aggregation and 2 editorial agents running simultaneously. Aggregation and editorial operations displayed here should be considered independently, i.e. even though the editorial operations graph shows higher results on the Amazon m3.2xlarge instance, values are normalized and refer to the corresponding type of operation.</p> +<p><img src="8-0-Performance.png" alt="image"></p> +<p>Figure 2: OWLIM performance on 2 Amazon instances and 2 local machines, with 8 aggregation agents running simultaneously. Read-only mode.</p> +<p>Another thing that we’re using LDBC-SPB for is to monitor load performance. Loading of generated data can be done either manually, by creating some sort of a script (e.g. using cURL), or by the benchmark driver itself, which will execute a standard POST request against a provided SPARQL endpoint. The benchmark’s data generator can be configured to produce chunks of generated data in various sizes, which can be used for experiments on load performance. Of course, load times of forward-chaining reasoners cannot be compared to those of backward-chaining ones, which is not the goal of the benchmark. Loading performance is not measured “officially” by LDBC-SPB (although the time for loading the data is reported), but it is a good thing to have when comparing RDF stores.</p> +<p>An additional and interesting feature of the SPB is the test for conformance to the OWL2-RL rule-set. It is part of the LDBC-SPB benchmark and that phase is called <em>checkConformance</em>. The phase is run independently of the benchmark phase itself. It requires no data generation or loading except the initial set of ontologies. It tests the RDF store’s conformance to the rules in the OWL2-RL rule-set by executing a number of INSERT/ASK queries specific to each rule. The result of that phase is a list of all rules that have passed or failed, which is very useful for regression testing.</p> + + + + + Fourth TUC meeting + https://ldbcouncil.org/event/fourth-tuc-meeting/ + Thu, 03 Apr 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fourth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the fourth Technical User Community (TUC) meeting.</p> +<p>This will be a one-day event at CWI in Amsterdam on <em>Thursday April 3, 2014</em>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend.
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<p><strong>For presenters please limit your talks to just 15 minutes</strong></p> +<h3 id="agenda">Agenda</h3> +<p><strong>April 3rd</strong></p> +<ul> +<li> +<p>10:00 Peter Boncz (VUA) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506371.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=JYWVgrP1kVY">video</a>: <em>LDBC project status update</em></p> +</li> +<li> +<p>10:20 Norbert Martinez (UPC) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506375.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=4yREJQ3yDr0">video</a>: <em>Status update on the LDBC Social Network Benchmark (SNB) task force</em>.</p> +</li> +<li> +<p>10:50 Alexandru Iosup (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506363.ppt">ppt</a>, <a href="https://www.youtube.com/watch?v=ulT-RFwKpOE">video</a>: <em>Towards Benchmarking Graph-Processing Platforms</em></p> +</li> +<li> +<p>11:10 Mike Bryant (Kings College) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506364.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=KiHRTu9xx0A">video</a>: <em>EHRI Project: Archival Integration with Neo4j</em></p> +</li> +</ul> +<p><strong>11:30 coffee</strong></p> +<ul> +<li> +<p>11:50 Thilo Muth (University of Magdeburg) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506369.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=5xH3UDLP6Oc">video</a>: <em>MetaProteomeAnalyzer: a graph database backed software for functional and taxonomic protein data analysis</em></p> +</li> +<li> +<p>12:10 Davy Suvee (Janssen Pharmaceutica / Johnson &amp; Johnson) – <a href="https://www.youtube.com/watch?v=XN3LRJUfJIU">video</a>: <em>Euretos Brain - Experiences on using a graph database to analyse data stored as a scientific knowledge graph</em></p> +</li> +<li> +<p>12:30 Yongming Luo (TU Eindhoven) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506366.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=g_my3tBB2_s">video</a>: <em>Regularities and dynamics in bisimulation reductions of big graphs</em></p> +</li> +<li> +<p>12:50 Christopher Davis (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506370.pdf">pdf</a>, <a href="https://www.youtube.com/channel/UC6HbzfJ4016Vez-2HKNeDag">video</a>: <em>Enipedia - Enipedia is an active exploration into the applications of wikis and the semantic web for energy and industry issues</em></p> +</li> +</ul> +<p><strong>13:10 - 14:30 lunch @ restaurant Polder</strong></p> +<ul> +<li> +<p>14:30 <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506365.pptx">SPB task force report</a></p> +</li> +<li> +<p>15:00 Bastiaan Bijl (Sysunite) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506373.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=TsCeKDHShMY">video</a>: <em>Using a semantic approach for monitoring applications in large engineering projects</em></p> +</li> +<li> +<p>15:20 Frans Knibbe (Geodan) – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506372.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=uAX-m4OewPM">video</a>: <em>Benchmarks for geographical data</em></p> +</li> +<li> +<p>15:40 Armando Stellato (University of Rome, Tor Vergata &amp; UN Food and Agriculture Organization) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506374.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=mfA4csAs72Y">video</a>: <em>VocBench2.0, a Collaborative Environment for SKOS/SKOS-XL Management: scalability and (inter)operatibility challenges</em></p> +</li> +</ul> +<p><strong>16:00 coffee</strong></p> +<ul> +<li> +<p>16:20 Ralph Hodgson (TopQuadrant) – [pdf](https://pu b-3834 10a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachment s/5538064/5506367.pdf), <a href="https://www.youtube.com/watch?v=ZUDnVw9P_Rc">video</a>:<em>Customer experiences in implementing SKOS-based vocabularymanagement systems</em></p> +</li> +<li> +<p>16:40 Simon Jupp (European Bioinformatics Institute) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506368.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=CgTuOGK92W8">video</a>: <em>[Delivering RDF for the life science at the European Bioinformatics Institute: Six months in.]</em></p> +</li> +<li> +<p>17:00 Jerven Bolleman (Swiss Institute of Bioinformatics) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506381.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=QTc3yOgoEsg">video</a>: <em>Breakmarking UniProt RDF. SPARQL queries that make your database cry&hellip;</em></p> +</li> +<li> +<p>17:20 Rein van &rsquo;t Veer (Digital Heritage Netherlands) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506380.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=2vDrZoskGyQ">video</a> <em>Time and space for heritage</em></p> +</li> +<li> +<p>17:40 <strong>end of meeting</strong></p> +</li> +<li> +<p>19:00 - 21:30 Social Dinner in restaurant Boom</p> +</li> +</ul> +<p><strong>April 4th</strong></p> +<p>LDBC plenary meeting for project partners.</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506362.ppt">Benchmarking Graph-Processing Platforms: A Vision</a> – Alexandru Iosup</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p>The meeting will be held at the Dutch national research institute for computer science and mathematics (<a href="http://www.cwi.nl">CWI</a> - Centrum voor Wiskunde en Informatica). 
It is located at <a href="http://www.amsterdamsciencepark.nl/">Amsterdam Science Park</a>:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505821.jpg" alt=""></p> +<p>(<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505820.pdf">A5 map</a>)</p> +<h6 id="travel">Travel</h6> +<p><strong>Arriving &amp; departing:</strong></p> +<p>Amsterdam has a well-functioning and nearby airport called Schiphol (AMS, <a href="http://www.schiphol.com/">www.schiphol.nl</a>) that serves all main European carriers and also very many low-fare carriers.</p> +<p><a href="http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane">http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane</a></p> +<p><strong>Trains</strong> (~5 per hour) are the most convenient means of transport between Schiphol airport and Amsterdam city center, the Centraal Station (17 minutes, a train every 15 minutes) &ndash; which station you are also likely arriving at in case of an international train trip.</p> +<p>From the Centraal Station in Amsterdam, there is a direct train (every half an hour, runs 11 minutes) to the Science Park station, which is walking distance of CWI. If you go from the Centraal Station to one of the hotels, you should take tram 9 &ndash; it starts at Centraal Station (exception: for Hotel Casa 400, you should take the metro to Amstel station - any of the metros will do).</p> +<p><strong>Taxi</strong> is an alternative, though expensive. The price from Schiphol will be around 45 EUR to the CWI or another point in the city center (depending on traffic, the ride is 20-30 minutes).</p> +<p><strong>Public transportation</strong> (tram, bus, metro) tickets for a single ride and 1-day (24 hour) passes can be purchased from the driver/conductor on trams and buses (cash only) and from vending machines in the metro stations.</p> +<p><strong>Only the &ldquo;disposable&rdquo; cards are interesting for you as visitor.</strong></p> +<p>Multi-day (up to 7-days/168 hours) passes can only be purchased from the vending machines or from the ticket office opposite of Centraal Station.</p> +<p><strong>Getting Around:</strong> the fastest way to move in the city of Amsterdam generally is by bicycle. Consider renting such a device at your hotel. For getting from your hotel to the CWI, you can either take a taxi (expensive), have a long walk (35min), use public transportation (for NH Tropen/The Manor take bus 40 from Muiderpoort Station, for Hotel Casa 400 same bus 40 but from Amstel station, and for the Rembrandt Hotel it is tram 9 until Middenweg/Kruislaan and then bus 40), or indeed bike for 12 minutes.</p> +<p><strong>Cars</strong></p> +<p>In case you plan to arrive by car, please be aware that parking space in Amsterdam is scarce and hence very expensive. But, you can park your car on the &ldquo;WCW&rdquo; terrain where CWI is located. To enter the terrain by car, you have to get a ticket from the machine at the gate. To leave the terrain, again, you can get an exit ticket from the CWI reception.</p> +<p><strong>Arriving at CWI:</strong> Once you arrive at CWI, you need to meet the reception, and tell them that you are attending the LDBC TUC meeting. 
Then, you&rsquo;ll receive a visitor&rsquo;s pass that allows you to enter our building.</p> +<p><strong>Social Dinner</strong></p> +<p>The social dinner will take place at 7pm on April 3 in Restaurant Boom (<a href="http://www.boometenendrinken.nl/">boometenendrinken.nl</a>), Linneausstraat 63, Amsterdam.</p> + + + + + Third TUC Meeting + https://ldbcouncil.org/event/third-tuc-meeting/ + Tue, 19 Nov 2013 08:00:00 +0000 + + https://ldbcouncil.org/event/third-tuc-meeting/ + <p>The LDBC consortium is pleased to announce the third Technical User Community (TUC) meeting!</p> +<p>This will be a one day event in London on the <strong>19 November 2013</strong> running in collaboration with the <a href="http://www.graphconnect.com/london/">GraphConnect</a> event (18/19 November). Registered TUC participants that would like a free pass to all of GraphConnect should register for GraphConnect using this following coupon code: <strong>LDBCTUC</strong>.</p> +<p>The TUC event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology</li> +<li>Industry discussions on the contents of the benchmarks</li> +</ul> +<p>We will also be launching the LDBC non-profit organization, so anyone outside the EU project will be able to join as a member.</p> +<p>We will kick off new benchmark development task forces in the coming year, and talks at this coming TUC will play an important role in deciding the use case scenarios that will drive those benchmarks.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a></li> +<li><a href="#ldbctuc-background">LDBC/TUC Background</a> +<ul> +<li><a href="#social-network-benchmark">Social Network Benchmark</a></li> +<li><a href="#semantic-publishing-benchmark">Semantic Publishing Benchmark</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>November 19th - Public TUC Meeting</strong></p> +<p>8:00 Breakfast and registration will open for Graph Connect/TUC at 8:00 am (Dexter House)</p> +<p>short LDBC presentation (Peter Boncz) during GraphConnect keynote by Emil Eifrem (09:00-09:30 Dexter House)</p> +<p>NOTE: the TUC meeting is at the Tower Hotel, nearby Dexter House.</p> +<p>10:00 TUC Meeting Opening (Peter Boncz)</p> +<p>10:10 TUC Presentations (RDF Application Descriptions)</p> +<ul> +<li>Johan Hjerling (BBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275669.pdf">BBC Linked Data and the Semantic Publishing Benchmark</a></strong></em></li> +<li>Andreas Both (Unister): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505027.pdf">Ontology-driven applications in an e-commerce context</a></strong></em></li> +<li>Nuno Carvalho (Fujitsu Laboratories Europe): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275666.pdf"><em><strong>Fujitsu RDF use cases and benchmarking requirements</strong></em></a></li> +<li>Robina Clayphan (Europeana): <em><strong><a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816977.ppt">Europeana and Open Data</a></strong></em></li> +</ul> +<p>11:30 Semantic Publishing Benchmark (SPB)</p> +<ul> +<li>Venelin Kotsev (Ontotext - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">Semantic Publishing Benchmark Task Force Update</a></strong></em> and <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">report</a></strong></em></li> +</ul> +<p>12:00-13:00 Lunch at the Graph Connect venue</p> +<p><em>Talks During Lunch:</em></p> +<ul> +<li>Pedro Furtado, Jorge Bernardino (Univ. Coimbra): <strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275671.pdf">KEYSTONE Cost Action</a></strong></li> +</ul> +<p>13:00 TUC Presentations (Graph Application Descriptions)</p> +<ul> +<li>Minqi Zhou / Weining Qian (East China Normal University): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275670.pdf">Elastic and realistic social media data generation</a></strong></em></li> +<li>Andrew Sherlock (Shapespace): <em><strong>Shapespace Use Case</strong></em></li> +<li>Sebastian Verheughe (Telenor): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275667.pdf">Real-time Resource Authorization</a></strong></em></li> +</ul> +<p>14:00 Social Network Benchmark (SNB)</p> +<ul> +<li>Norbert Martinez (UPC - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505025.pdf">Social Network Benchmark Task Force Update</a></strong></em> and <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816975.pdf">Report</a></li> +</ul> +<p><em>14:30 Break</em></p> +<p>14:45 TUC Presentations (Graph Analytics)</p> +<ul> +<li>Keith Houck (IBM): <em><strong>Benchmarking experiences with [System G Native Store (tentative title)]</strong></em></li> +<li>Abraham Bernstein (University of Zurich): <em><strong>Streams and Advanced Processing: Benchmarking RDF querying beyond the Standard SPARQL Triple Store</strong></em></li> +<li>Luis Ceze (University of Washington): <em><strong>Grappa and GraphBench Status Update</strong></em></li> +</ul> +<p><em>15:45 Break</em></p> +<p>16:00 TUC Presentations* (Possible Future RDF Benchmarking Topics)*</p> +<ul> +<li>Christian-Emil Ore (Unit for Digital Documentation, University of Oslo, Norway): <em><strong>CIDOC-CRM</strong></em></li> +<li>Atanas Kiryakov (Ontotext): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275672.pdf">Large-scale Reasoning with a Complex Cultural Heritage Ontology (CIDOC CRM)</a></strong></em></li> +<li>Kostis Kyzirakos (National and Kapodistrian University of Athens / CWI): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275668.pdf">Geographica: A Benchmark for Geospatial RDF Stores</a></strong></em></li> +<li>Xavier Lopez (Oracle): <em><strong>W3C Property Graph progress</strong></em></li> +<li>Thomas Scharrenbach (University Zurich) <em><strong>PCKS: Benchmarking Semantic Flow Processing Systems</strong></em></li> +</ul> +<p>17:20 
Meeting Conclusion (Josep Larriba Pey)</p> +<p>17:30 End of TUC meeting</p> +<p>19:00 Social dinner</p> +<p><strong>November 20th - Internal LDBC Meeting</strong></p> +<p>10:00 Start</p> +<p>12:30 <em>End of meeting</em></p> +<ul> +<li>coffee and lunch provided</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p><strong>Date</strong></p> +<p>19th November 2013</p> +<p><strong>Location</strong></p> +<p>The TUC meeting will be held in <strong>The Tower</strong> hotel (<a href="http://goo.gl/qZt8Fz">Google Maps link</a>) approximately 4 minutes walk from the <a href="http://www.graphconnect.com/london/">GraphConnect</a> conference in London.</p> +<p>Getting there</p> +<ul> +<li>From City Airport is the easiest: short ride on the DLR to Tower Gateway. Easy.</li> +<li>From London Heathrow: first need to take the Heathrow Express to Paddington. Then take the Circle line to Tower Hill. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554995.pdf">See attached</a>.</li> +</ul> +<h3 id="ldbctuc-background">LDBC/TUC Background</h3> +<p>Looking back, we have been working on two benchmarks for the past year: a Social Network Benchmark (SNB) and a Semantic Publishing Benchmark (SPB). While below we provide a short summary, all the details of the work on these benchmark development efforts can be found in the first yearly progress reports:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SNB_Report_Nov2013.pdf</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SPB_Report_Nov2013.pdf</a></li> +</ul> +<p>A summary of these efforts can be read below or, for a more detailed account, please refer to: <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554967.pdf">The Linked Data Benchmark Council: a Graph and RDF industry benchmarking effort</a>. Annual reports about the progress, results, and future work of these two efforts will soon be available for download here, and will be discussed in depth at the TUC.</p> +<h4 id="social-network-benchmark">Social Network Benchmark</h4> +<p>The Social Network Benchmark (SNB) is designed for evaluating a broad range of technologies for tackling graph data management workloads. The systems targeted are quite broad: from graph, RDF, and relational database systems to Pregel-like graph compute frameworks. The social network scenario was chosen with the following goals in mind:</p> +<ul> +<li>it should be understandable, and the relevance of managing such data should be understandable</li> +<li>it should cover the complete range of interesting challenges, according to the benchmark scope</li> +<li>the queries should be realistic, i.e., similar data and workloads are encountered in practice</li> +</ul> +<p>SNB includes a data generator for creation of synthetic social network data with the following characteristics:</p> +<ul> +<li>data schema is representative of real social networks</li> +<li>data generated includes properties occurring in real data, e.g. 
irregular structure, structure/value correlations, power-law distributions</li> +<li>the software generator is easy-to-use, configurable and scalable</li> +</ul> +<p>SNB is intended to cover a broad range of aspects of social network data management, and therefore includes three distinct workloads:</p> +<ul> +<li><strong>Interactive</strong> +<ul> +<li>Tests system throughput with relatively simple queries and concurrent updates; it is designed to test ACID features and scalability in an online operational setting.</li> +<li>The targeted systems are expected to be those that offer transactional functionality.</li> +</ul> +</li> +<li><strong>Business Intelligence</strong> +<ul> +<li>Consists of complex structured queries for analyzing the online behavior of users for marketing purposes; it is designed to stress query execution and optimization.</li> +<li>The targeted systems are expected to be those that offer an abstract query language.</li> +</ul> +</li> +<li><strong>Graph Analytics</strong> +<ul> +<li>Tests the functionality and scalability of systems for graph analytics, which typically cannot be expressed in a query language.</li> +<li>Analytics is performed on most/all of the data in the graph as a single operation and produces large intermediate results, and it is not expected to be transactional or to need isolation.</li> +<li>The targeted systems are graph compute frameworks, though database systems may compete, for example by using iterative implementations that repeatedly execute queries and keep intermediate results in temporary data structures.</li> +</ul> +</li> +</ul> +<h4 id="semantic-publishing-benchmark">Semantic Publishing Benchmark</h4> +<p>The Semantic Publishing Benchmark (SPB) simulates the management and consumption of RDF metadata that describes media assets, or creative works.</p> +<p>The scenario is a media organization that maintains RDF descriptions of its catalogue of creative works &ndash; input was provided by actual media organizations which make heavy use of RDF, including the BBC. The benchmark is designed to reflect a scenario where a large number of aggregation agents provide the heavy query workload, while at the same time a steady stream of creative work description management operations is in progress. This benchmark only targets RDF databases that support at least basic forms of semantic inference. A tagging ontology is used to connect individual creative work descriptions to instances from reference datasets, e.g. sports, geographical, or political information. The data used will fall under the following categories: reference data, which is a combination of several Linked Open Data datasets, e.g. GeoNames and DBpedia; domain ontologies, which are specialist ontologies used to describe certain areas of expertise of the publisher, e.g., sport and education; publication asset ontologies, which describe the structure and form of the assets that are published, e.g., news stories, photos, video, audio, etc.; and tagging ontologies and the metadata, which link assets with reference/domain ontologies.</p> +<p>The data generator is initialized by using several ontologies and datasets. The instance data collected from these datasets are then used at several points during the execution of the benchmark.
Data generation is performed by generating SPARQL fragments for create operations on creative works and executing them against the RDF database system.</p> +<p>Two separate workloads are modeled in SPB:</p> +<ul> +<li><strong>Editorial:</strong> Simulates creating, updating and deleting creative work metadata descriptions. Media companies use both manual and semi-automated processes for efficiently and correctly managing asset descriptions, as well as annotating them with relevant instances from reference ontologies.</li> +<li><strong>Aggregation:</strong> Simulates the dynamic aggregation of content for consumption by the distribution pipelines (e.g. a web-site). The publishing activity is described as &ldquo;dynamic&rdquo;, because the content is not manually selected and arranged on, say, a web page. Instead, templates for pages are defined and the content is selected when a consumer accesses the page.</li> +</ul> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505026.pdf">Status of the Semantic Publishing Benchmark</a></p> + + + + + Second TUC Meeting + https://ldbcouncil.org/event/second-tuc-meeting/ + Mon, 22 Apr 2013 10:00:00 +0000 + + https://ldbcouncil.org/event/second-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the second Technical User Community (TUC) meeting.</p> +<p>This will be a two day event in Munich on the <strong>22/23rd April 2013</strong>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend. 
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +<li><a href="#venue">Venue</a> +<ul> +<li><a href="#getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</a></li> +<li><a href="#getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</a></li> +<li><a href="#getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</a></li> +</ul> +</li> +<li><a href="#getting-there">Getting there</a></li> +<li><a href="#social-dinner">Social Dinner</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>April 22nd</strong></p> +<p>10:00 <em>Registration.</em><br> +10:30 Josep Lluis Larriba Pey (UPC) - <em>Welcome and Introduction.</em><br> +10:30 Peter Boncz (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687373.pptx">LDBC: goals and status</a></p> +<p><em>Social Network Use Cases (with discussion moderated by Josep Lluis Larriba Pey)</em></p> +<p>11:00 Josep Lluis Larriba Pey (UPC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687372.pdf">Social Network Benchmark Task Force</a><br> +11:30 Gustavo González (Mediapro): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687367.pdf">Graph-based User Modeling through Real-time Social Streams</a><br> +12:00 Klaus Großmann (Dshini): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687365.pdf">Neo4j at Dshini</a></p> +<p>12:30 Lunch</p> +<p><em>Semantic Publishing Use Cases (with discussion moderated by Barry Bishop)</em></p> +<p>13:30 Barry Bishop (Ontotext): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687366.pptx">Semantic Publishing Benchmark Task Force</a><br> +14:00 Dave Rogers (BBC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687364.pptx">Linked Data Platform at the BBC</a><br> +14:30 Edward Thomas (Wolters Kluwer): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687374.pdf">Semantic Publishing at Wolters Kluwer</a></p> +<p>15:00 Coffee break</p> +<p><em>Projects Related to LDBC</em></p> +<p>15:30 Fabian Suchanek (MPI): &ldquo;YAGO: A large knowledge base from Wikipedia and WordNet&rdquo;<br> +16:00 Antonis Loziou (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687375.pptx">The OpenPHACTS approach to data integration</a><br> +16:30 Mirko Kämpf (Brox): &ldquo;GeoKnow - Spatial Data Web project and Supply Chain Use Case&rdquo;</p> +<p>17:00 <em>End of first day</em></p> +<p>19:00 Social dinner</p> +<p><strong>April 23rd</strong></p> +<p><em>Industry &amp; Hardware Aspects</em></p> +<p>10:00 Xavier Lopez (Oracle): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687384.pdf">Graph Database Performance an Oracle Perspective.pdf</a><br> +10:30 Pedro Trancoso (University of Cyprus): &ldquo;Benchmarking and computer architecture: the research 
side&rdquo;</p> +<p>11:00 Coffee break</p> +<p><em>Future Steps and TUC feedback session</em></p> +<p>11:30 Peter Boncz (VUA) moderates: next steps in the Social Networking Task Force<br> +12:00 Barry Bishop (Ontotext) moderates: next steps in the Semantic Publishing Task Force</p> +<p>12:30 <em>End of meeting</em></p> +<h3 id="logistics">Logistics</h3> +<h4 id="date">Date</h4> +<p>22nd and 23rd April 2013</p> +<h4 id="location">Location</h4> +<p>The TUC meeting will be held in room LE009 at LRZ (Leibniz-Rechenzentrum), located inside the TU Munich campus in Garching, Germany. The address is:</p> +<p>LRZ (Leibniz-Rechenzentrum)<br> +Boltzmannstraße 1<br> +85748 Garching, Germany</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including taxi and subway (<a href="http://www.in.tum.de/fileadmin/user_upload/Sonstiges/anfahrt_garching.pdf">U-Bahn</a>).</p> +<h5 id="getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</h5> +<p>Take the U-Bahn line U6 in the direction of Garching-Forschungszentrum and exit at the end station. Take the south exit to the MI-Building and LRZ on the Garching Campus. The journey from the city center takes approx. 25-30 minutes. In order to get here from the city center, you need the Munich XXL ticket, which costs around 7.50 euros and covers all types of transportation for one day. The ticket has to be validated before the ride.</p> +<h5 id="getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</h5> +<ol> +<li> +<p>(except weekends) S-Bahn S8 line in the direction of (Hauptbahnhof) Munich Central Station until the third stop, Ismaning (approx. 13 minutes). From here, Bus Nr. 230 until the stop MI-Building on the Garching Campus. Alternatively: S1 line until Neufahrn, then Bus 690, which stops at Boltzmannstraße.</p> +</li> +<li> +<p>S-Bahn lines S8 or S1 towards the City Center until the Marienplatz stop. Then change to the U-Bahn U6 line towards Garching-Forschungszentrum and exit at the last station. Take the south exit to the MI-Building and LRZ.</p> +</li> +<li> +<p>Taxi: the fare is ca. 30-40 euros.</p> +</li> +</ol> +<p>For cases 1 and 2, before the trip get the One-day Munich Airport ticket and validate it. It will cover all public transportation for that day.</p> +<h5 id="getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</h5> +<p>The city of Garching is located on the U6 line, one stop before Garching-Forschungszentrum. In order to get from Garching to Garching-Forschungszentrum with the U-Bahn, a special one-way ticket called Kurzstrecke (1.30 euros) can be purchased.</p> +<p><strong>Finding LRZ@TUM</strong></p> +<p><a href="http://www.openstreetmap.org/?mlat=48.2615702464&amp;mlon=11.6686558264&amp;zoom=32">OpenStreetMap link</a></p> +<p><a href="https://maps.google.com/maps?q=48.2615702464,11.6686558264&amp;spn=0.005,0.005&amp;t=k">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687268.gif" alt=""></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687269.gif" alt=""></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying:</strong> Munich airport is located 28.5 km northeast of Munich. There are two ways to get from the airport to the city center: suburban train (S-Bahn) and taxi.</p> +<p><strong>S-Bahn:</strong> S-Bahn lines S1 and S8 will get you from the Munich airport to the city center, stopping at both Munich Central Station (Hauptbahnhof) and Marienplatz. A one-day Airport-City ticket costs 11.20 euros and is valid for the entire Munich area public transportation during the day of purchase (the ticket needs to be validated before the journey). The S-Bahn leaves every 5-20 minutes and reaches the city center in approx. 40 minutes.</p> +<p><strong>Taxi:</strong> a taxi from the airport to the city center costs approximately 50 euros.</p> +<h4 id="social-dinner">Social Dinner</h4> +<p>The social dinner will take place at 7 pm on April 22 in the Hofbräuhaus (second floor).</p> +<p>Address: Hofbräuhaus, Platzl 9, Munich</p> + + + + + First TUC Meeting + https://ldbcouncil.org/event/first-tuc-meeting/ + Mon, 19 Nov 2012 09:00:00 +0100 + + https://ldbcouncil.org/event/first-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the first Technical User Community (TUC) meeting. This will be a two-day event in Barcelona on the <strong>19/20th November 2012</strong>.</p> +<p>So far more than six commercial consumers of graph/RDF database technology have expressed an interest in attending the event and more are welcome. The proposed format of the event will include:</p> +<ul> +<li>Introduction by the coordinator and technical director explaining the objectives of the LDBC project</li> +<li>Invitation to users to explain their use-cases and describe the limitations they have found in current technology</li> +<li>Brain-storming session for identifying trends and mapping out strategies to tackle existing choke-points</li> +</ul> +<p>The exact agenda will be published here as things get finalised before the event.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#slide">Slide</a> +<ul> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +</ul> +</li> +<li><a href="#venue">Venue</a></li> +<li><a href="#getting-there">Getting there</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p>We will start at 9:00 on Monday for a full day, followed by half a day on Tuesday to allow attendees to travel home on the evening of the 20th.</p> +<p><strong>Day 1</strong></p> +<p>09:00 Welcome (Location: Aula Master)<br> +09:30 Project overview (Emphasis on task forces?)
+ Questionnaire results?<br> +10:30 Coffee break<br> +11:00 User talks (To gather information for use cases?)</p> +<p>13:00 Lunch</p> +<p>14:00 User talks (cont.)<br> +15:00 Use case discussions (based on questionnaire results + consortium proposal + user talks).<br> +16:00 Task force proposals (consortium)<br> +17:00 Finish first day</p> +<p>20:00 Social dinner</p> +<p><strong>Day 2</strong></p> +<p>10:00 Task force discussion (consortium + TUC)<br> +11:00 Coffe break<br> +11:30 Task force discussion (consortium + TUC)<br> +12:30 Summaries (Task forces, use cases, &hellip;) and actions</p> +<p>13:00 Lunch and farewell</p> +<p>15:00 LDBC Internal meeting</p> +<h3 id="slide">Slide</h3> +<p>Opening session:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686995.pptx">CWI – Peter Boncz</a> – Objectives</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687001.pdf">UPC – Larri</a> – Questionnaire</li> +</ul> +<p>User stories:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686998.pdf">BBC – Jem Rayfield</a></li> +<li>CA Technologies – Victor Muntés</li> +<li>Connected Discovery (Open Phacts) – Bryn Williams-Jones</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687003.pptx">Elsevier – Alan Yagoda</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687000.pptx">ERA7 Bioinformatics – Eduardo Pareja</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687005.pptx">Press Association – Jarred McGinnis</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687004.pptx">RJLee – David Neuer</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686994.pdf">Yale – Lec Maj</a></li> +</ul> +<p>Benchmark proposals:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686991.pdf">Publishing benchmark proposal – Ontotext – Barry Bishop</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687002.pdf">Social Network Benchmark Proposal – UPC – Larri</a></li> +</ul> +<h4 id="logistics">Logistics</h4> +<h5 id="date">Date</h5> +<p>19th and 20th November 2012</p> +<h5 id="location">Location</h5> +<p>The TUC meeting will be held at “Aula Master” at A3 building located inside the “Campus Nord de la UPC” in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<p><strong>Finding UPC</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<p><strong>Finding the meeting room</strong></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €16 and trips to other destinations in the city cost approximately €18.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<p><strong>The locations of the airport and the city centre</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933317.jpg" alt=""></p> +<p><strong>Bus map</strong></p> + + + + + \ No newline at end of file diff --git a/gql-community/lex/index.html b/gql-community/lex/index.html new file mode 100644 index 00000000..cd0c32d9 --- /dev/null +++ b/gql-community/lex/index.html @@ -0,0 +1,378 @@ + + + + + LDBC Extended GQL Schema (LEX) working group + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

LDBC Extended GQL Schema (LEX) working group

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

Group leader: Alastair Green (JCC)

+

Active members:

+
    +
  • Koji Annoura
  • +
  • Michael Behrisch
  • +
  • Stephen Cannan
  • +
  • Alin Deutsch
  • +
  • George Fletcher
  • +
  • Thomas Friesendal
  • +
  • Denise Gosnell
  • +
  • Alastair Green
  • +
  • Cole Greer
  • +
  • Zhihui Guo
  • +
  • Keith Hare
  • +
  • Jan Hidders
  • +
  • Longbin Lai
  • +
  • Heng Lin
  • +
  • Alessandro Mosca
  • +
  • Stefan Plantikow
  • +
  • Yuya Sasaki
  • +
  • Ognjen Savkovic
  • +
  • Michael Schmidt
  • +
  • Dominik Tomaszuk
  • +
  • Yang Xia
  • +
  • Wenyuan Yu
  • +
  • Tao Wang
  • +
  • Dušan Živkovic
  • +
  • and 15+ observers
  • +
+

See the LEX work charter which details the group’s mission, motivation, and scope of work.

+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/overview/index.html b/gql-community/overview/index.html new file mode 100644 index 00000000..3c266ddf --- /dev/null +++ b/gql-community/overview/index.html @@ -0,0 +1,361 @@ + + + + + LDBC Graph Query Working Groups + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

LDBC Graph Query Working Groups

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

LDBC’s working groups investigate research questions on graph query languages and language extensions for graphs.
+Their work targeted the ISO/IEC SQL/PGQ language extension (released in June 2023) and the ISO/IEC GQL language (released in April 2024).
+LDBC released open GQL language tools in May 2024.

+

Active Working Groups

+ +

Historical Working Groups

+ + +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/page/1/index.html b/gql-community/page/1/index.html new file mode 100644 index 00000000..7780d3ca --- /dev/null +++ b/gql-community/page/1/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/gql-community/ + + + + + + diff --git a/gql-community/page/2/index.html b/gql-community/page/2/index.html new file mode 100644 index 00000000..539d7012 --- /dev/null +++ b/gql-community/page/2/index.html @@ -0,0 +1,804 @@ + + + + + Gql communities + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Gql-communities

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+ +
+ +

We are delighted to announce the formation of the Financial Benchmark (FinBench) task force.

+

The Financial Benchmark (FinBench) project aims to define a benchmark for evaluating graph databases, and to develop a data generation process and a query driver to make the evaluation of graph databases representative, reliable and comparable, especially in financial scenarios such as anti-fraud and risk control. The FinBench is scheduled to be released in the …

+ +
+
+ +
+ + +
+
+
+ +

Speeding Up LDBC SNB Datagen

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

LDBC’s Social Network Benchmark [4] (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework where different graph-based technologies can be fairly tested and compared, that can drive the identification of systems’ bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data …

+ +
+
+ +
+ + + + + +
+
+
+ +

LDBC and Apache Flink

+
Tags:
+ FLINK + , DATAGEN + , SNB + +
+
+ +

Apache Flink [1] is an open source platform for distributed stream and batch data processing. Flink’s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.

+

+

Flink offers multiple APIs to process data …

+ +
+
+ +
+ + +
+
+
+ +

Elements of Instance Matching Benchmarks: a Short Overview

+
Tags:
+ INSTANCE MATCHING + , SPB + +
+
+ +

The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not …

+ +
+
+ +
+ + +
+
+ +
+ +

In this post we will look at running the LDBC SNB on Virtuoso.

+

First, let’s recap what the benchmark is about:

+
    +
  1. +

    fairly frequent short updates, with no update contention worth mentioning

    +
  2. +
  3. +

    short random lookups

    +
  4. +
  5. +

    medium complex queries centered around a person’s social environment

    +
  6. +
+

The updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/page/3/index.html b/gql-community/page/3/index.html new file mode 100644 index 00000000..8b688406 --- /dev/null +++ b/gql-community/page/3/index.html @@ -0,0 +1,796 @@ + + + + + Gql communities + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Gql-communities

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

SNB and Graphs Related Presentations at GRADES '15

+
Tags:
+ SIGMOD + , GRAPHALYTICS + , GRADES + , SNB + , DATAGEN + , WORKSHOP + +
+
+ +

On the 31st of May, the GRADES workshop will take place in Melbourne within the ACM SIGMOD/PODS conference. GRADES started as an initiative of the Linked Data Benchmark Council at SIGMOD/PODS 2013, held in New York.

+

Among the papers published in this edition we have “Graphalytics: A Big Data Benchmark for Graph-Processing Platforms”, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can …

+ +
+
+ +
+ + +
+
+
+ +

SNB Interactive Part 2: Modeling Choices

+
Tags:
+ SNB + , VIRTUOSO + , INTERACTIVE + +
+
+ +

​SNB Interactive is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.

+

In the case of Virtuoso, we have played with SQL and SPARQL implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that …

+ +
+
+ +
+ + +
+
+
+ +

LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference

+
Tags:
+ SIGMOD + , GRADES + , SNB + , GRAPHALYTICS + , WORKSHOP + +
+
+ +

LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015. The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.

+

On the industry track, LDBC will be presenting the Social Network Benchmark Interactive …

+ +
+
+ +
+ + +
+
+
+ +

SNB Interactive Part 1: What Is SNB Interactive Really About?

+
Tags:
+ SNB + , VIRTUOSO + , INTERACTIVE + +
+
+ +

This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. This is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of same.

+

With two implementations of SNB interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its …

+ +
+
+ +
+ + +
+
+
+ +

Why Do We Need an LDBC SNB-Specific Workload Driver?

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

In a previous 3-part blog series we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn’t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more …

+ +
+
+ +
+ + +
+
+
+ +

Event Driven Post Generation in Datagen

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain in more depth how this is actually implemented inside the generator.

+

First of all, I start with a few basics of how Datagen works internally. In Datagen, once the person graph has been created (persons and their relationships), …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/page/4/index.html b/gql-community/page/4/index.html new file mode 100644 index 00000000..d66ab584 --- /dev/null +++ b/gql-community/page/4/index.html @@ -0,0 +1,768 @@ + + + + + Gql communities + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Gql-communities

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

The LDBC Datagen Community Structure

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.

+

When generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other, more qualitative characteristics such as the degree distribution and the clustering coefficient. Real graphs, and …

+ +
+
+ +
+ + +
+
+
+ +

Industry Relevance of the Semantic Publishing Benchmark

+
Tags:
+ INDUSTRY + , SPB + +
+
+ + + post/industry-relevance-of-the-semantic-publishing-benchmark/01_sf_newspapers.png +
+ +
+ +

Publishing and media businesses are going through transformation

+

I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and …

+ +
+
+ +
+ + +
+
+
+ +

OWL-Empowered SPARQL Query Optimization

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution …

+ +
+
+ +
+ + +
+
+
+ +

Person Activity Subgraph Features in LDBC DATAGEN

+
Tags:
+ SNB + , DATAGEN + +
+
+ +

When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically drawn to the friendship subgraph and/or its structure. However, a social graph is more than a bunch of people connected by friendship relations; it has many other aspects worth looking at. With a quick look at commercial social networks like Facebook, Twitter or Google+, one can easily identify a lot of other …

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 2: Tracking Dependencies Between Queries

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

The SNB Driver part 1 post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we’ll drill down deeper into the details of what it means to execute “dependent queries” during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in …

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 3: Workload Execution Putting It All Together

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

Up until now we have introduced the challenges faced when executing the LDBC SNB benchmark, as well as explained how some of these are overcome. With the foundations laid, we can now explain precisely how operations are executed.

+

Based on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/page/5/index.html b/gql-community/page/5/index.html new file mode 100644 index 00000000..395d57ae --- /dev/null +++ b/gql-community/page/5/index.html @@ -0,0 +1,768 @@ + + + + + Gql communities + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Gql-communities

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide

+
Tags:
+ SPB + , SESAME + , RDF + , TUTORIAL + , GUIDE + +
+
+ +

Until now we have discussed several aspects of the Semantic Publishing Benchmark (SPB), such as the difference in performance between virtual and real server configurations, how to choose an appropriate query mix for a benchmark run, and our experience with using SPB in the development process of GraphDB for finding performance issues.

+

In this post we provide a step-by-step guide on how to run SPB using the Sesame RDF data store on a fresh install …

+ +
+
+ +
+ + +
+
+
+ +

Semantic Publishing Instance Matching Benchmark

+
Tags:
+ INSTANCE MATCHING + , BENCHMARK + +
+
+ +

The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the-art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.

+

The SPIMBench …

+ +
+
+ +
+ + +
+
+
+ +

Further Developments in SNB BI Workload

+
Tags:
+ SNB + , BI + +
+
+ +

We are presently working on the SNB BI workload. Andrey Gubichev of TU München and I are going through the queries and are playing with two SQL-based implementations, one on Virtuoso and the other on Hyper.

+

As discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.

+

There are obvious marketing applications for a SNB-like dataset. There are also security …

+ +
+
+ +
+ + +
+
+
+ +

Sizing AWS Instances for the Semantic Publishing Benchmark

+
Tags:
+ SPB + , AMAZON + , EC2 + , AWS + , RDF + +
+
+ +

LDBC’s Semantic Publishing Benchmark (SPB) measures the performance of an RDF database under a load typical for metadata-based content publishing, such as the famous BBC Dynamic Semantic Publishing scenario. Such a load combines tens of updates per second (e.g. adding metadata about new articles) with an even higher volume of read requests (SPARQL queries collecting recent content and data to generate a web page on a specific subject, e.g. Frank …

+ +
+
+ +
+ + +
+
+
+ +

DATAGEN: a Realistic Social Network Data Generator

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

In previous posts (Getting started with snb, DATAGEN: data generation for the Social Network Benchmark), Arnau Prat discussed the main features and characteristics of DATAGEN: realism, scalability, determinism, usability. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity in a social network site during a period of time. In this post, we conduct a series of experiments …

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 1

+
Tags:
+ SNB + , DRIVER + , TPC-C + , INTERACTIVE + +
+
+ +

In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as driver). Software and documentation for this driver is available here: …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/page/6/index.html b/gql-community/page/6/index.html new file mode 100644 index 00000000..242529ba --- /dev/null +++ b/gql-community/page/6/index.html @@ -0,0 +1,776 @@ + + + + + Gql communities + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Gql-communities

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Making Semantic Publishing Execution Rules

+
Tags:
+ SPB + , TEST RUN + +
+
+ +

LDBC SPB (Semantic Publishing Benchmark) is based on the BBC linked data platform use case. Thus, the data modelling and transaction mix reflect the BBC’s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an Ontotext GraphDB deployment. GraphDB was formerly known as OWLIM.

+

So, in SPB we wanted to address substantially more complex queries than the lookups that …

+ +
+
+ +
+ + +
+
+ +
+ +

The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies …

+ +
+
+ +
+ + +
+
+
+ +

Choke Point Based Benchmark Design

+
Tags:
+ DATABASE + , BENCHMARK + , DESIGN + +
+
+ +

The Linked Data Benchmark Council’s (LDBC) mission is to design and maintain benchmarks for graph data management systems, to establish and enforce standards for running these benchmarks, and to publish and arbitrate the official benchmark results. The council and its https://ldbcouncil.org website just launched, and in its first 1.5 years of existence, most effort at LDBC has gone into investigating the needs of the field through interaction …

+ +
+
+ +
+ + +
+
+
+ +

New Website Online LDBC Benchmarks Reach Public Draft

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23 2014, in announcing that two of the benchmarks that it has been developing for the past 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In the case of LDBC, the release is staged: for now, the benchmark software runs read-only queries only. This will be …

+ +
+
+ +
+ + +
+
+
+ +

Social Network Benchmark Goals

+
Tags:
+ SNB + , DATAGEN + , INTERACTIVE + , BI + , GRAPHALYTICS + +
+
+ +

Social Network interaction is amongst the most natural and widespread activities of the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, Social Networks are well understood from the point of view of the data involved and the interaction required by their actors. Thus, concepts such as friends of friends or retweets are well established …

+ +
+
+ +
+ + +
+
+ +
+ +

It is with great pleasure that we announce the new LDBC organisation site at www.ldbcouncil.org. The LDBC started as a European Community FP7-funded project with the objective of creating, fostering, and becoming an industry reference for benchmarking RDF and Graph technologies. A period of more than one and a half years has led us to the creation of the first two workloads, the Semantic Publishing Benchmark and the Social Network Benchmark in its …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/page/7/index.html b/gql-community/page/7/index.html new file mode 100644 index 00000000..6c148158 --- /dev/null +++ b/gql-community/page/7/index.html @@ -0,0 +1,794 @@ + + + + + Gql communities + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Gql-communities

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

2nd International Workshop on Benchmarking RDF Systems

+
Tags:
+ WORKSHOP + , CFP + , BENCHMARK + , BERSYS + +
+
+ +

Following the 1st International Workshop on Benchmarking RDF Systems (BeRSys 2013), the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industry practitioners can meet to discuss topics related to the performance of RDF systems. BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines, in the line of the TPCTC series of workshops. The focus of the workshop is to expose and initiate …

+ +
+
+ +
+ + +
+
+
+ +

DATAGEN: Data Generation for the Social Network Benchmark

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective of providing a realistic yet challenging workload, consisting of a social network and a set of queries. Both have to be realistic, easy to understand and easy to generate. This post discusses the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 [1].

+

One of the most …

+ +
+
+ +
+ + +
+
+
+ +

Getting Started With SNB

+
Tags:
+ SNB + , INTERACTIVE + , DATAGEN + +
+
+ +

In a previous blog post titled “Is SNB like Facebook’s LinkBench?”, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.

+

DATAGEN

+

DATAGEN is the data generator used by all the workloads of SNB. Here we introduced the …

+ +
+
+ +
+ + +
+
+ +
+ +

The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads, interactive, business intelligence and graph analytics. This post introduces the interactive workload.

+

The benchmark measures the speed of queries of medium complexity against a social network being constantly updated. The queries are scoped to a user’s social environment and potentially access data associated with the friends of a user and their friends.
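To make that scoping concrete, here is a hypothetical toy sketch in Scala (not code from the benchmark; the graph and names are made up) of the one- and two-hop neighbourhood that such queries typically touch.

object SocialEnvironmentSketch {
  def main(args: Array[String]): Unit = {
    // A made-up, in-memory friendship graph keyed by person name.
    val friends: Map[String, Set[String]] = Map(
      "alice" -> Set("bob", "carol"),
      "bob"   -> Set("alice", "dave"),
      "carol" -> Set("alice"),
      "dave"  -> Set("bob")
    )
    val start = "alice"
    // One hop: the person's direct friends.
    val oneHop = friends.getOrElse(start, Set.empty[String])
    // Two hops: friends of friends, excluding direct friends and the start person.
    val twoHop = oneHop.flatMap(friends.getOrElse(_, Set.empty[String])) -- oneHop - start
    println(s"friends of $start: $oneHop")
    println(s"friends of friends of $start: $twoHop")
  }
}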

+

This …

+ +
+
+ +
+ + +
+
+
+ +

Is SNB Like Facebooks LinkBench

+
Tags:
+ DEVELOPER + , SNB + , INTERACTIVE + , BI + , GRAPHALYTICS + +
+
+ + + post/is-snb-like-facebooks-linkbench/SNB-workloads-vs-systems.jpg +
+ +
+ +

In this post, I will discuss in some detail the rationale and goals of the design of the Social Network Benchmark (SNB) and explain how it relates to real …

+ +
+
+ +
+ + +
+
+
+ +

Making It Interactive

+
Tags:
+ SNB + , BENCHMARKING + , TPC + , SPARQL + , INTERACTIVE + +
+
+ +

Synopsis: Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must both be credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation of what online systems in fact do. So, the workload mix must strike a balance between reflecting practice and presenting new challenges.

+

It is about to be showtime for LDBC. The initial installment of the …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/page/8/index.html b/gql-community/page/8/index.html new file mode 100644 index 00000000..92e0c9e5 --- /dev/null +++ b/gql-community/page/8/index.html @@ -0,0 +1,709 @@ + + + + + Gql communities + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Gql-communities

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

SNB Data Generator - Getting Started

+
Tags:
+ DATAGEN + , SNB + , SOCIAL NETWORK + +
+
+ +

In previous posts (this and this) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datasets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.

+

Getting and Configuring Hadoop

+

DATAGEN runs on top of Hadoop 1.2.1 to be scalable. …

+ +
+
+ +
+ + +
+
+
+ +

The Day of Graph Analytics

+
Tags:
+ ANALYTICS + , SNB + +
+
+ +

Note: consider this post as a continuation of the “Making it interactive” post by Orri Erling.

+

I have now completed the Virtuoso TPC-H work, including scale-out. Optimization possibilities extend to infinity, but the present level is good enough. TPC-H is the classic of all analytics benchmarks and is difficult enough; I have extensive commentary on this on my blog (In Hoc Signo Vinces series), including experimental results. This is, …

+ +
+
+ +
+ + +
+
+
+ +

Using LDBC SPB to Find OWLIM Performance Issues

+
Tags:
+ LDBC + , SPB + , RDF + +
+
+ +

During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC Semantic Publishing Benchmark (LDBC-SPB) as a part of our development and release process.

+

The first thing we started using the LDBC-SPB for is to monitor the performance of our RDF Store when a new release is about to come out.

+

Initially, we decided to fix some of the benchmark parameters:

+
    +
  • the dataset size - 50 million triples (LDBC-SPB50) * benchmark warmup …
+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/gql-community/pgswg/index.html b/gql-community/pgswg/index.html new file mode 100644 index 00000000..12de0366 --- /dev/null +++ b/gql-community/pgswg/index.html @@ -0,0 +1,511 @@ + + + + + Property Graph Schema Working Group (PGSWG) + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Property Graph Schema Working Group (PGSWG)

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+

Group leaders: Jan Hidders (Birkbeck College, University of London), Juan Sequeda (data.world)

+

The PGSWG has 4 sub-groups: PG-Basic, PG-Constraints, PG-Properties, PG-Nulls

+

PG-Basic

+
    +
  • Group leader: Jan Hidders (Birkbeck College, University of London)
  • +
  • Focus: Basic constructs and semantics
  • +
+

Group members

+
    +
  • Alastair Green (JCC Consulting; Birkbeck College, University of London)
  • +
  • Angela Bonifati (Lyon 1 University)
  • +
  • Bei Li (Google)
  • +
  • Dominik Tomaszuk (University of Bialystok)
  • +
  • Enrico Franconi (Free University of Bozen-Bolzano)
  • +
  • George Fletcher (Eindhoven TU)
  • +
  • Gilles Privat (Orange S.A.)
  • +
  • Hannes Voigt (Neo4j)
  • +
  • Harsh Thakkar (Consultant OSTHUS GmBH)
  • +
  • Jan Hidders (Birkbeck College, University of London)
  • +
  • Jason Crawford (Amazon)
  • +
  • Josh Perryman (VeracityID)
  • +
  • Joshua Shinavier (LinkedIn)
  • +
  • Juan Sequeda (data.world)
  • +
  • Keith W. Hare (JCC Consulting)
  • +
  • Koji Annoura (UTI, Inc.)
  • +
  • Leonid Libkin (ENS Paris, University of Edinburgh)
  • +
  • Liat Peterfreund (ENS Paris)
  • +
  • Michael Schmidt (Amazon Web Services)
  • +
  • Renzo Angles (Universidad de Talca)
  • +
  • Slawek Staworko (Université de Lille)
  • +
  • Stefania Dumbrava (Ecole Nationale Supérieure d’Informatique pour l’Industrie et l’Entreprise (ENSIIE))
  • +
  • Victor Lee (TigerGraph)
  • +
  • Victor Marsault (CNRS)
  • +
  • Wim Martens (University of Bayreuth)
  • +
  • Wook-Shin Han (POSTECH)
  • +
+

PG-Constraints

+
    +
  • Group leader: George Fletcher (TU Eindhoven)
  • +
  • Focus: Key constraints and cardinality constraints
  • +
+

Group members

+
    +
  • Alastair Green (JCC Consulting; Birkbeck College, University of London)
  • +
  • Andrea Cali (Birkbeck College, University of London)
  • +
  • Angela Bonifati (Lyon 1 University)
  • +
  • Bei Li (Google)
  • +
  • Borislav Iordanov (Kobrix)
  • +
  • Dominik Tomaszuk (University of Bialystok)
  • +
  • Enrico Franconi (Free University of Bozen-Bolzano)
  • +
  • Filip Murlak (University of Warsaw)
  • +
  • George Fletcher (Eindhoven TU)
  • +
  • Jan Hidders (Birkbeck College, University of London)
  • +
  • Jason Crawford (Amazon)
  • +
  • Josh Perryman (VeracityID)
  • +
  • Juan Sequeda (data.world)
  • +
  • Keith W. Hare (JCC Consulting)
  • +
  • Koji Annoura (UTI, Inc.)
  • +
  • Leonid Libkin (ENS Paris, University of Edinburgh)
  • +
  • Michael Schmidt (Amazon Web Services)
  • +
  • Slawek Staworko (Université de Lille)
  • +
  • Stefania Dumbrava (Ecole Nationale Supérieure d’Informatique pour l’Industrie et l’Entreprise (ENSIIE))
  • +
  • Wim Martens (University of Bayreuth)
  • +
  • Wook-Shin Han (POSTECH)
  • +
+

PG-Properties

+
    +
  • Group leader: Joshua Shinavier (LinkedIn)
  • +
  • Focus: Data types for properties
  • +
+

Group members

+
    +
  • Alastair Green (JCC Consulting; Birkbeck College, University of London)
  • +
  • Angela Bonifati (Lyon 1 University)
  • +
  • Bei Li (Google)
  • +
  • Borislav Iordanov (Kobrix)
  • +
  • Dominik Tomaszuk (University of Bialystok)
  • +
  • Enrico Franconi (Free University of Bozen-Bolzano)
  • +
  • Filip Murlak (University of Warsaw)
  • +
  • George Fletcher (Eindhoven TU)
  • +
  • Gilles Privat (Orange S.A.)
  • +
  • Harsh Thakkar (Consultant OSTHUS GmBH)
  • +
  • Jan Hidders (Birkbeck College, University of London)
  • +
  • Jason Crawford (Amazon)
  • +
  • Josh Perryman (VeracityID)
  • +
  • Joshua Shinavier (LinkedIn)
  • +
  • Juan Sequeda (data.world)
  • +
  • Keith W. Hare (JCC Consulting)
  • +
  • Koji Annoura (UTI, Inc.)
  • +
  • Michael Schmidt (Amazon Web Services)
  • +
  • Renzo Angles (Universidad de Talca)
  • +
  • Stefania Dumbrava (Ecole Nationale Supérieure d’Informatique pour l’Industrie et l’Entreprise (ENSIIE))
  • +
  • Victor Lee (TigerGraph)
  • +
  • Victor Marsault (CNRS)
  • +
  • Wim Martens (University of Bayreuth)
  • +
  • Wook-Shin Han (POSTECH)
  • +
+

PG-Nulls

+
    +
  • Group leader: Angela Bonifati (Lyon 1 University)
  • +
  • Focus: Null values
  • +
+

Group members

+
    +
  • Alastair Green (JCC Consulting; Birkbeck College, University of London)
  • +
  • Angela Bonifati (Lyon 1 University)
  • +
  • Dominik Tomaszuk (University of Bialystok)
  • +
  • Enrico Franconi (Free University of Bozen-Bolzano)
  • +
  • Filip Murlak (University of Warsaw)
  • +
  • Gilles Privat (Orange S.A.)
  • +
  • Jan Hidders (Birkbeck College, University of London)
  • +
  • Joshua Shinavier (LinkedIn)
  • +
  • Juan Sequeda (data.world)
  • +
  • Koji Annoura (UTI, Inc.)
  • +
  • Leonid Libkin (ENS Paris, University of Edinburgh)
  • +
  • Liat Peterfreund (ENS Paris)
  • +
  • Michael Schmidt (Amazon Web Services)
  • +
  • Paolo Guagliardo (University of Edinburgh)
  • +
  • Slawek Staworko (Université de Lille)
  • +
  • Stefania Dumbrava (Ecole Nationale Supérieure d’Informatique pour l’Industrie et l’Entreprise (ENSIIE))
  • +
  • Victor Lee (TigerGraph)
  • +
  • Wim Martens (University of Bayreuth)
  • +
  • Wook-Shin Han (POSTECH)
  • +
+

Threshold queries

+
    +
  • Angela Bonifati (Lyon 1 University)
  • +
  • Dominik Tomaszuk (University of Bialystok)
  • +
  • Filip Murlak (University of Warsaw)
  • +
  • George Fletcher (Eindhoven TU)
  • +
  • Jan Hidders (Birkbeck College, University of London)
  • +
  • Joshua Shinavier (LinkedIn)
  • +
  • Matthias Hofer (University of Bayreuth)
  • +
  • Slawek Staworko (Université de Lille)
  • +
  • Stefania Dumbrava (Ecole Nationale Supérieure d’Informatique pour l’Industrie et l’Entreprise (ENSIIE))
  • +
  • Wim Martens (University of Bayreuth)
  • +
+ +
+
+ +
+
+
+
+
+
+
+
+

Latest Working Group Updates

+
+
+

+ + +
+
+ +

Launching open-source language tools for ISO/IEC GQL

+
+ 09 May 2024 +

Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and …

+
+ + +
+ +
+
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/images/cube_1.png b/images/cube_1.png new file mode 100644 index 00000000..4aa4affc Binary files /dev/null and b/images/cube_1.png differ diff --git a/images/cube_2.png b/images/cube_2.png new file mode 100644 index 00000000..24c0f989 Binary files /dev/null and b/images/cube_2.png differ diff --git a/images/cube_full.png b/images/cube_full.png new file mode 100644 index 00000000..4494f35b Binary files /dev/null and b/images/cube_full.png differ diff --git a/images/favicon.ico b/images/favicon.ico new file mode 100644 index 00000000..30ec30d8 Binary files /dev/null and b/images/favicon.ico differ diff --git a/images/favicon.png b/images/favicon.png new file mode 100644 index 00000000..3df75eb3 Binary files /dev/null and b/images/favicon.png differ diff --git a/images/graphscope.svg b/images/graphscope.svg new file mode 100644 index 00000000..06b5800e --- /dev/null +++ b/images/graphscope.svg @@ -0,0 +1 @@ +资源 2xxx \ No newline at end of file diff --git a/images/ldbc-title.png b/images/ldbc-title.png new file mode 100644 index 00000000..a09f58fb Binary files /dev/null and b/images/ldbc-title.png differ diff --git a/images/ldbc.png b/images/ldbc.png new file mode 100644 index 00000000..3df75eb3 Binary files /dev/null and b/images/ldbc.png differ diff --git a/images/members/alibaba-cloud.png b/images/members/alibaba-cloud.png new file mode 100644 index 00000000..13b9be68 Binary files /dev/null and b/images/members/alibaba-cloud.png differ diff --git a/images/members/alibaba-damo-academy.png b/images/members/alibaba-damo-academy.png new file mode 100644 index 00000000..3cb019aa Binary files /dev/null and b/images/members/alibaba-damo-academy.png differ diff --git a/images/members/antgroup.png b/images/members/antgroup.png new file mode 100644 index 00000000..530d1e31 Binary files /dev/null and b/images/members/antgroup.png differ diff --git a/images/members/arangodb.png b/images/members/arangodb.png new file mode 100644 index 00000000..2bf688a9 Binary files /dev/null and b/images/members/arangodb.png differ diff --git a/images/members/aws.png b/images/members/aws.png new file mode 100644 index 00000000..50bd7486 Binary files /dev/null and b/images/members/aws.png differ diff --git a/images/members/birkbeck.jpg b/images/members/birkbeck.jpg new file mode 100644 index 00000000..944188d0 Binary files /dev/null and b/images/members/birkbeck.jpg differ diff --git a/images/members/createlink.png b/images/members/createlink.png new file mode 100644 index 00000000..c0b31a29 Binary files /dev/null and b/images/members/createlink.png differ diff --git a/images/members/ens-paris.png b/images/members/ens-paris.png new file mode 100644 index 00000000..70ab294f Binary files /dev/null and b/images/members/ens-paris.png differ diff --git a/images/members/fabarta.jpg b/images/members/fabarta.jpg new file mode 100644 index 00000000..9fe574a4 Binary files /dev/null and b/images/members/fabarta.jpg differ diff --git a/images/members/forth.png b/images/members/forth.png new file mode 100644 index 00000000..ef3b6ac3 Binary files /dev/null and b/images/members/forth.png differ diff --git a/images/members/intel.png b/images/members/intel.png new file mode 100644 index 00000000..a53621a4 Binary files /dev/null and b/images/members/intel.png differ diff --git a/images/members/jcc.png b/images/members/jcc.png new file mode 100644 index 00000000..ad2acd0c Binary files /dev/null and 
b/images/members/jcc.png differ diff --git a/images/members/memgraph.png b/images/members/memgraph.png new file mode 100644 index 00000000..275528ca Binary files /dev/null and b/images/members/memgraph.png differ diff --git a/images/members/nebulagraph.png b/images/members/nebulagraph.png new file mode 100644 index 00000000..34fcb91d Binary files /dev/null and b/images/members/nebulagraph.png differ diff --git a/images/members/neo4j.png b/images/members/neo4j.png new file mode 100644 index 00000000..84469cd6 Binary files /dev/null and b/images/members/neo4j.png differ diff --git a/images/members/ontotext.jpg b/images/members/ontotext.jpg new file mode 100644 index 00000000..1692fb75 Binary files /dev/null and b/images/members/ontotext.jpg differ diff --git a/images/members/oracle-labs.png b/images/members/oracle-labs.png new file mode 100644 index 00000000..86fe547e Binary files /dev/null and b/images/members/oracle-labs.png differ diff --git a/images/members/pometry.png b/images/members/pometry.png new file mode 100644 index 00000000..53333010 Binary files /dev/null and b/images/members/pometry.png differ diff --git a/images/members/redis-labs.png b/images/members/redis-labs.png new file mode 100644 index 00000000..f86a9d3b Binary files /dev/null and b/images/members/redis-labs.png differ diff --git a/images/members/relationalai.png b/images/members/relationalai.png new file mode 100644 index 00000000..7cdbe348 Binary files /dev/null and b/images/members/relationalai.png differ diff --git a/images/members/sparsity.png b/images/members/sparsity.png new file mode 100644 index 00000000..a2926454 Binary files /dev/null and b/images/members/sparsity.png differ diff --git a/images/members/stargraph.png b/images/members/stargraph.png new file mode 100644 index 00000000..75564389 Binary files /dev/null and b/images/members/stargraph.png differ diff --git a/images/members/thatdot.png b/images/members/thatdot.png new file mode 100644 index 00000000..ba97b9ba Binary files /dev/null and b/images/members/thatdot.png differ diff --git a/images/members/tigergraph.png b/images/members/tigergraph.png new file mode 100644 index 00000000..fc8e0984 Binary files /dev/null and b/images/members/tigergraph.png differ diff --git a/images/members/ultipa.png b/images/members/ultipa.png new file mode 100644 index 00000000..61f8afc8 Binary files /dev/null and b/images/members/ultipa.png differ diff --git a/images/members/volcengine.png b/images/members/volcengine.png new file mode 100644 index 00000000..3d2c9371 Binary files /dev/null and b/images/members/volcengine.png differ diff --git a/images/slide-image-1.jpg b/images/slide-image-1.jpg new file mode 100644 index 00000000..17ff8d92 Binary files /dev/null and b/images/slide-image-1.jpg differ diff --git a/images/slide-image-2.jpg b/images/slide-image-2.jpg new file mode 100644 index 00000000..af1cac9f Binary files /dev/null and b/images/slide-image-2.jpg differ diff --git a/images/slide-image-3.jpg b/images/slide-image-3.jpg new file mode 100644 index 00000000..970ebbe7 Binary files /dev/null and b/images/slide-image-3.jpg differ diff --git a/images/slide-image-4.jpg b/images/slide-image-4.jpg new file mode 100644 index 00000000..880ea210 Binary files /dev/null and b/images/slide-image-4.jpg differ diff --git a/images/steering-committee-pictures/alastair-green.jpg b/images/steering-committee-pictures/alastair-green.jpg new file mode 100644 index 00000000..4a4fa88f Binary files /dev/null and b/images/steering-committee-pictures/alastair-green.jpg differ diff --git 
a/images/steering-committee-pictures/ben-steer.jpg b/images/steering-committee-pictures/ben-steer.jpg new file mode 100644 index 00000000..fd6e0ff4 Binary files /dev/null and b/images/steering-committee-pictures/ben-steer.jpg differ diff --git a/images/steering-committee-pictures/gabor-szarnyas.jpg b/images/steering-committee-pictures/gabor-szarnyas.jpg new file mode 100644 index 00000000..a47d1d3e Binary files /dev/null and b/images/steering-committee-pictures/gabor-szarnyas.jpg differ diff --git a/images/steering-committee-pictures/judy-bingham.jpg b/images/steering-committee-pictures/judy-bingham.jpg new file mode 100644 index 00000000..d3acc221 Binary files /dev/null and b/images/steering-committee-pictures/judy-bingham.jpg differ diff --git a/images/steering-committee-pictures/oskar-van-rest.jpg b/images/steering-committee-pictures/oskar-van-rest.jpg new file mode 100644 index 00000000..a2a58161 Binary files /dev/null and b/images/steering-committee-pictures/oskar-van-rest.jpg differ diff --git a/images/steering-committee-pictures/peter-boncz.jpg b/images/steering-committee-pictures/peter-boncz.jpg new file mode 100644 index 00000000..49b1bb77 Binary files /dev/null and b/images/steering-committee-pictures/peter-boncz.jpg differ diff --git a/images/steering-committee-pictures/shipeng-qi.jpg b/images/steering-committee-pictures/shipeng-qi.jpg new file mode 100644 index 00000000..e41ea82f Binary files /dev/null and b/images/steering-committee-pictures/shipeng-qi.jpg differ diff --git a/index.html b/index.html new file mode 100644 index 00000000..94acb1f2 --- /dev/null +++ b/index.html @@ -0,0 +1,488 @@ + + + + + Linked Data Benchmark Council + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + + + + + +
+
+ + +
+
+
+
+

Welcome to the LDBC website

+

On this website, you can find information on benchmark specifications and audited results, on how the LDBC organization works, and on benchmarking resources.

+

+ + Read More + +
+
+
+
+ + +
+
+
+
+

Community engagement

+

LDBC brings industry and users together to develop benchmarks by which the state of the art and advances in graph database technologies can be assessed and directed.

+

+ + Read More + +
+
+
+
+ + +
+
+
+
+

Benchmarks

+

LDBC’s benchmarks include the Social Network Benchmark suite, the Semantic Publishing Benchmark, and Graphalytics.

+

+ + Read More + +
+
+
+
+ + +
+
+
+
+

Industry

+

On these pages, we provide information on the LDBC organization and its members, including information on how to become a member.

+

+ + Read More + +
+
+
+
+ +
+
+ + + + + + + + + + + + + +
+
+
+
+
+

Latest Updates

+
+
+

+ + +
+
+ +

Eighteenth TUC Meeting

+
+ 24 Apr 2024 +

Organizers: Shipeng Qi (AntGroup), Wenyuan Yu (Alibaba Damo Academy), Yan Zhou (CreateLink)

+

LDBC is hosting a two-day hybrid workshop, co-located in Guangzhou with VLDB 2024 on August 30-31 (Friday-Saturday).

+

The …

+
+ + +
+ +
+
+ +

Seventeenth TUC Meeting

+
+ 18 Apr 2024 +

Organizers: Renzo Angles, Sebastián Ferrada

+

LDBC is hosting a one-day in-person workshop, co-located in Santiago de Chile with SIGMOD 2024 on June 9 (Sunday).

+

The workshop will be held in the Hotel Plaza El …

+
+ + +
+ +
+
+ +

Record-Breaking SNB Interactive Results for GraphScope

+
+ 26 May 2024 +

We are happy to announce new audited results for the SNB Interactive workload, achieved by the open-source GraphScope Flex system.

+

The current audit of the system has broken several records:

+
    +
  • It achieved …
+
+ + +
+ +
+
+ +

Launching open-source language tools for ISO/IEC GQL

+
+ 09 May 2024 +

Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and …

+
+ + +
+ +
+
+ +

Announcing the Official Release of LDBC Financial Benchmark v0.1.0

+
+ 27 Jun 2023 +

We are delighted to announce the official release of the initial version (v0.1.0) of the Financial Benchmark (FinBench).

+

The Financial Benchmark (FinBench) project defines a graph database benchmark targeting …

+
+ + +
+ +
+
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/index.json b/index.json new file mode 100644 index 00000000..3fbe7572 --- /dev/null +++ b/index.json @@ -0,0 +1 @@ +[{"categories":null,"contents":"Organizers: Shipeng Qi (AntGroup), Wenyuan Yu (Alibaba Demo), Yan Zhou (CreateLink)\nLDBC is hosting a two-day hybrid workshop, co-located in Guangzhou with VLDB 2024 on August 30-31 (Friday-Saturday).\nThe program consists of 10- and 15-minute talks followed by a Q\u0026amp;A session. The talks will be recorded and made available online. If you would like to participate please register using our form.\nProgram All times are in PDT.\nAugust 30, Friday Location: Langham Place, Guangzhou, room 1,\nco-located with VLDB (N0.630-638 Xingang Dong Road, Haizhu District, Guangzhou, China). See the map here.\nAgenda: TBA\nAugust 31, Saturday Location: Alibaba Center, Guangzhou (N0.88 Dingxin Road, Haizhu District, Guangzhou, China), near to VLDB Langham Place. See the map here.\nAgenda: TBA\nTUC event locations A map of the LDBC TUC events we hosted so far.\n","permalink":"https://ldbcouncil.org/event/eighteenth-tuc-meeting/","tags":["TUC Meeting"],"title":"Eighteenth TUC Meeting"},{"categories":null,"contents":"Organizers: Renzo Angles, Sebastián Ferrada\nLDBC is hosting a one-day in-person workshop, co-located in Santiago de Chile with SIGMOD 2024 on June 9 (Sunday).\nThe workshop will be held in the Hotel Plaza El Bosque Ebro (https://www.plazaelbosque.cl), which is two blocks away from SIGMOD\u0026rsquo;s venue. See the map here.\nIf you would like to participate please register using this form.\nProgram All times are in Chile time (GMT-4).\nEach speaker will have 20 minutes for exposition plus 5 minutes for questions.\nTime Speaker Title 09:00 Welcome \u0026ldquo;Canelo\u0026rdquo; saloon 09:30 Alastair Green (LDBC Vice-chair) Status of the LDBC Extended GQL Schema Working Group 10:00 Hannes Voigt (Neo4j) Inside the Standardization Machine Room: How ISO/IEC 39075:2024 – GQL was produced 10:30 Calin Iorgulescu (Oracle) PGX.D: Distributed graph processing engine 11:00 Coffee break 11:30 Ricky Sun (Ultipa, Inc.) A Unified Graph Framework with SCC (Storage-Compute Coupled) and HDC (High-Density Computing) Clustering 12:00 Daan de Graaf (TU Eindhoven) Algorithm Support in a Graph Database, Done Right 12:30 Angela Bonifati (Lyon 1 University and IUF, France) Transforming Property Graphs 13:00 Brunch 14:00 Juan Sequeda (data.world) A Benchmark to Understand the Role of Knowledge Graphs on Large Language Model\u0026rsquo;s Accuracy for Question Answering on Enterprise SQL Databases 14:30 Olaf Hartig (Linköping University) FedShop: A Benchmark for Testing the Scalability of SPARQL Federation Engines 15:00 Olaf Hartig (Amazon) Datatypes for Lists and Maps in RDF Literals 15:30 Peter Boncz (CWI and MotherDuck) The state of DuckPGQ 16:00 Coffee break 16:30 Juan Reutter (IMFD and PUC Chile) MillenniumDB: A Persistent, Open-Source, Graph Database 17:00 Carlos Rojas (IMFD) WDBench: A Wikidata Graph Query Benchmark 17:30 Sebastián Ferrada (IMFD and Univ. 
de Chile) An algebra for evaluating path queries 19:30 Dinner ","permalink":"https://ldbcouncil.org/event/seventeenth-tuc-meeting/","tags":["TUC Meeting","Santiago","Chile"],"title":"Seventeenth TUC Meeting"},{"categories":null,"contents":"We are happy to annonunce new audited results for the SNB Interactive workload, achieved by the open-source GraphScope Flex system.\nThe current audit of the system has broken several records:\nIt achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s. It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s. It is the first system to successfully complete the benchmark on scale factor 1000. It achieved a throughput of 127.8k ops/s The audit was commissioned by the Alibaba Cloud and was conducted by Dr. Arnau Prat-Pérez, one of the original authors of the SNB Interactive benchmark. The queries were implemented as C++ stored procedures and the benchmark was executed on the Alibaba Cloud\u0026rsquo;s infrastructure. The executive summary, full disclosure report, and supplementary package describe the benchmark\u0026rsquo;s steps and include instructions for reproduction.\nLDBC would like to congratulate the GraphScope Flex team on their record-breaking results.\n","permalink":"https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/","tags":["benchmark","snb"],"title":"Record-Breaking SNB Interactive Results for GraphScope"},{"categories":null,"contents":"Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and tests for the GQL language. See this announcement from Alastair Green, Vice-chair of LDBC.\nThese tools are the work of the LDBC GQL Implementation Working Group, headed up by Michael Burbidge. Damian Wileński and Dominik Tomaszuk have worked with Michael to create these artefacts based on his ANTLR grammar for GQL.\n","permalink":"https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/","tags":["gql"],"title":"Launching open-source language tools for ISO/IEC GQL"},{"categories":null,"contents":"By Alastair Green, Vice-chair LDBC, and author of the GQL Manifesto.\n9 May 2024\nThe GQL standard was published in mid-April by ISO. See WG3 Convenor Keith Hare’s summary: ISO/IEC JTC 1 GQL Database Language\nLinked Data Benchmark Council (LDBC) is releasing early-version open-source GQL grammar tools.\nOpen GQL Language Tools There are three interlinked projects:\nANTLR grammar repository GQL Code Editor Web UI (and repository) Railroad Diagrams Web Page (and repository) A commit of a new version of the grammar automatically rebuilds and deploys the Code Editor and the Railroad Diagrams.\nMichael Burbidge (who leads our GQL Implementation Working Group), Damian Wileński, and Dominik Tomaszuk are responsible for making all this happen, so soon after the release of GQL. Wonderful work!\nThe tools are a work in progress, so expect evolution. Feel free to raise issues on Github.\nThe mission of the GQL Implementation Working Group is to create tooling and documentation to assist in and accelerate the implementation and adoption of GQL. See the working group charter for more information.\nCode examples for Technical Reports The Code Editor lets you create syntactically correct GQL examples. 
It is not connected to an implementation of the GQL spec, so type checking, variable scoping rules, etc., that are typically done by semantic analysis of the parse tree, are not enforced by the Code Editor.\nI used Code Editor to create/check the code examples in my last post on LinkedIn, GQL in code, which links through to\nGQL on one page: DDL, DML and GPML\nIt is also being used to help create a forthcoming LDBC Technical Report on GQL, which (unlike the spec) will be freely available to all, and will contain numerous examples.\nTowards a GQL TCK More is in the works: we have begun work on a Test Compatibility Kit, modelled on the the openCypher TCK, but that’s a big job.\nWe need and welcome active contributions to all these community efforts.\nIf you are interested, please ping Michael at michael.burbidge@ldbcouncil.org.\nThe Linked Data Benchmark Council LDBC is a non-profit consortium of vendors, researchers and independent practitioners interested in graph data management.\nLDBC defines benchmark standards for graph data workloads (using RDF, SQL, and property graph languages). It is a meeting point and working space for community efforts supportive of the GQL and SQL/PGQ property graph standards.\nIt supervises the audited execution of comparable benchmark runs which are reported with cost metrics, following the lead of TPC. Only audited results published by LDBC can be described as LDBC Benchmark(R) results.\nLDBC is run by its 20+ organizational members including Oracle, Ant Group, Intel, Neo4j, TigerGraph, Fabarta, thatDot, Ontotext, ArangoDB, Relational AI, Stargraph, Nebula Graph, Sparksee, FORTH, Memgraph, Createlink, Alibaba DAMO Academy (Graphscope), Birkbeck University of London and AWS.\nThere are 70+ individual associate members (who join for free and support its working groups and task forces).\nRecent and current initiatives include the Finance Benchmark, LDBC Extended GQL Schema (LEX), and GQL Implementation.\nThe G-CORE, PG-Keys, Graph Pattern Matching in GQL and SQL/PGQ and PG-Schema papers (all published at SIGMOD) directly reflect the work of LDBC participants on graph data languages, over the years.\nLDBC is a Category C Liaison of ISO/IEC JTC1 SC32/WG3 (the SQL and GQL standards committee). Jan Hidders, Michael Burbidge and Alastair Green are LDBC’s representatives in WG3.\nFor all enquiries, including membership enquiries, please email info@ldbcouncil.org.\n","permalink":"https://ldbcouncil.org/pages/opengql-announce/","tags":["GQL"],"title":"LDBC open-source GQL tools"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-wc-wc-2023-03/","tags":[],"title":"LDBC GQL Implementation Work Charter 1.1"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-wc-wc-2023-01/","tags":[],"title":"LDBC Extended GQL Schema (LEX) Work Charter 1.1"},{"categories":null,"contents":"We are delighted to announce the official release of the initial version (v0.1.0) of Financial Benchmark (FinBench).\nThe Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the LDBC FinBench Task Force. 
The benchmark has one workload currently, Transaction Workload, capturing OLTP scenario with complex read queries that access the neighbourhood of a given node in the graph and write queries that continuously insert or delete data in the graph.\nCompared to LDBC SNB, the FinBench differs in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. For a brief overview, see the slides in the 16th TUC. The Financial Benchmark\u0026rsquo;s specification can be found on arXiv.\nThe release of FinBench initial version (v0.1.0) was approved by LDBC on June 23, 2023. It is the good beginning of FinBench. In the future, the FinBench Task Force will polish the benchmark continuously.\nIf you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or qishipeng.qsp at antgroup.com.\n","permalink":"https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/","tags":["finbench"],"title":"Announcing the Official Release of LDBC Financial Benchmark v0.1.0"},{"categories":null,"contents":"Organizers: Oskar van Rest, Alastair Green, Gábor Szárnyas\nLDBC is hosting a two-day hybrid workshop, co-located with SIGMOD 2023 on June 23-24 (Friday-Saturday).\nThe program consists of 10- and 15-minute talks followed by a Q\u0026amp;A session. The talks will be recorded and made available online. If you would like to participate please register using our form.\nLDBC will host a social event on Friday at the Black Bottle gastrotavern in Belltown: 2600 1st Ave (on the corner of Vine), Seattle, WA 98121.\nIn addition, AWS will host a Happy Hour (rooftop grill with beverages) on Saturday on the Amazon Nitro South building\u0026rsquo;s 8th floor deck: 2205 8th Ave, Seattle, WA 98121.\nProgram All times are in PDT.\nFriday Location: Hyatt Regency Bellevue on Seattle\u0026rsquo;s Eastside, room Grand K, co-located with SIGMOD (900 Bellevue Way NE, Bellevue, WA 98004-4272)\nstart finish speaker title 08:30 08:45 Oskar van Rest (Oracle) LDBC – State of the union – slides, video 08:50 09:05 Keith Hare (JCC / WG3) An update on the GQL \u0026amp; SQL/PGQ standards efforts – slides, video 09:10 09:25 Stefan Plantikow (Neo4j / WG3) GQL - Introduction to a new query language standard – slides 09:30 09:45 Leonid Libkin (University of Edinburgh \u0026amp; RelationalAI) Formalizing GQL – slides, video 09:50 10:05 Semen Panenkov (JetBrains Research) Mechanizing the GQL semantics in Coq – slides, videos 10:10 10:25 Oskar van Rest (Oracle) SQL Property Graphs in Oracle Database and Oracle Graph Server (PGX) – slides, video 10:30 11:00 coffee break 11:00 11:15 Alastair Green (JCC) LDBC\u0026rsquo;s organizational changes and fair use policies – slides 11:20 11:35 Ioana Manolescu (INRIA) Integrating Connection Search in Graph Queries – slides, video 11:40 11:55 Maciej Besta (ETH Zurich) Neural Graph Databases with Graph Neural Networks – video 12:00 12:10 Longbin Lai (Alibaba Damo Academy) To Revisit Benchmarking Graph Analytics – slides, video 12:15 13:30 lunch 13:30 13:45 Yuanyuan Tian (Gray Systems Lab, Microsoft) The World of Graph Databases from An Industry Perspective – slides, video 13:50 14:05 Alin Deutsch (UC San Diego \u0026amp; TigerGraph) TigerGraph\u0026rsquo;s Parallel Computation Model – slides, video 14:10 14:25 Chen Zhang (CreateLink) Applications of a Native Distributed Graph Database in the Financial Industry – video 14:30 14:45 Ricky Sun (Ultipa) Design of highly scalable graph 
database systems – slides, video 14:50 15:30 coffee break 15:30 15:45 Heng Lin (Ant Group) The LDBC SNB implementation in TuGraph – slides, video 15:50 16:05 Shipeng Qi (Ant Group) FinBench: The new LDBC benchmark targeting financial scenario – slides, video 16:10 17:00 host: Heng Lin (Ant Group), panelists: Longbin Lai (Alibaba Damo Academy), Ricky Sun (Ultipa), Gabor Szarnyas (CWI), Yuanyuan Tian (Gray Systems Lab, Microsoft) FinBench panel – slides 19:00 22:00 dinner Black Bottle gastrotavern in Belltown: 2600 1st Ave (on the corner of Vine), Seattle, WA 98121 Saturday Location: Amazon Nitro South building, room 03.204 (2205 8th Ave, Seattle, WA 98121)\nstart finish speaker title 09:00 09:45 Brad Bebee (AWS) Customers don\u0026rsquo;t want a graph database, so why are we still here? – slides, video 10:00 10:15 Muhammad Attahir Jibril (TU Ilmenau) Fast and Efficient Update Handling for Graph H2TAP – slides, video 10:20 11:00 coffee break 11:00 11:15 Gabor Szarnyas (CWI) LDBC Social Network Benchmark and Graphalytics – slides 11:20 11:30 Atanas Kiryakov and Tomas Kovachev (Ontotext) GraphDB – Benchmarking against LDBC SNB \u0026amp; SPB – slides, video 11:35 11:50 Roi Lipman (Redis Labs) Delta sparse matrices within RedisGraph – slides, video 11:55 12:05 Rathijit Sen (Microsoft) Microarchitectural Analysis of Graph BI Queries on RDBMS – slides, video 12:10 13:30 lunch on your own 13:30 13:45 Alastair Green (JCC) LEX \u0026ndash; LDBC Extended GQL Schema – slides, video 13:50 14:05 Ora Lassila (AWS) Why limit yourself to {RDF, LPG} when you can do {RDF, LPG}, too – slides, video 14:10 14:25 Jan Hidders (Birkbeck, University of London) PG-Schema: a proposal for a schema language for property graphs – slides, video 14:30 14:45 Max de Marzi (RageDB and RelationalAI) RageDB: Building a Graph Database in Anger – slides, video 14:50 15:30 coffee break 15:30 15:45 Umit Catalyurek (AWS) HPC Graph Analytics on the OneGraph Model – slides, video 15:50 16:05 David J. Haglin (Trovares) How LDBC impacts Trovares – slides, video 16:10 16:25 Wenyuan Yu (Alibaba Damo Academy) GraphScope Flex: A Graph Computing Stack with LEGO-Like Modularity – slides, video 16:30 16:40 Scott McMillan (Carnegie Mellon University) Graph processing using GraphBLAS – slides, video 16:45 16:55 Tim Mattson (Intel) Graphs (GraphBLAS) and storage (TileDB) as Sparse Linear algebra – slides 17:00 20:00 happy hour (rooftop grill with beverages) on the Nitro South building\u0026rsquo;s 8th floor deck TUC event locations A map of the LDBC TUC events we hosted so far.\n","permalink":"https://ldbcouncil.org/event/sixteenth-tuc-meeting/","tags":["TUC Meeting"],"title":"Sixteenth TUC Meeting"},{"categories":null,"contents":"2023 has been an eventful year for us so far. Here is a summary of our recent activities.\nOur paper The LDBC Social Network Benchmark: Business Intelligence Workload was published in PVLDB.\nDavid Püroja just completed his MSc thesis on creating a design towards SNB Interactive v2 at CWI\u0026rsquo;s Database Architectures group. 
David and I gave a deep-dive talk at the FOSDEM conference\u0026rsquo;s graph developer room titled The LDBC Social Network Benchmark (YouTube mirror).\nI gave a lightning talk at FOSDEM\u0026rsquo;s HPC developer room titled The LDBC Benchmark Suite (YouTube mirror).\nOur auditors have successfully benchmark a number of systems:\nSPB with the Ontotext GraphDB systems for the SF3 and SF5 data sets (auditor: Pjotr Scholtze) SNB Interactive with the Ontotext GraphDB system for the SF30 data set (auditor: David Püroja) SNB Interactive with the TuGraph system running in the Aliyun cloud for the SF30, SF100, and SF300 data sets (auditor: Márton Búr) The results and the full disclosure reports are available under the SPB and SNB benchmark pages.\n","permalink":"https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/","tags":["datagen","snb"],"title":"LDBC SNB – Early 2023 updates"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/david-puroja-msc/","tags":[],"title":"LDBC Social Network Benchmark Interactive v2"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/snb-work-charter/","tags":[],"title":"LDBC Social Network Benchmark task force work charter"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalscorrabs-2306-15975/","tags":[],"title":"The LDBC Financial Benchmark"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/tpctc-ldbc-snb-interactive-v-2/","tags":[],"title":"The LDBC Social Network Benchmark Interactive workload v2: A transactional graph query benchmark with deep delete operations"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/tpctc-ldbc-organization/","tags":[],"title":"The Linked Data Benchmark Council (LDBC): Driving competition and collaboration in the graph data management space"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-wc-wc-2022-02/","tags":[],"title":"LDBC Extended GQL Schema (LEX) Work Charter"},{"categories":null,"contents":"LDBC SNB provides a data generator, which produces synthetic datasets, mimicking a social network’s activity during a period of time. Datagen is defined by the charasteristics of realism, scalability, determinism and usability. More than two years have elapsed since my last technical update on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the challenges I faced during the migration. Since then, we reached several goals such as we refactored the serializers to use Spark\u0026rsquo;s high-level writers to support the popular Parquet data format and to enable running on spot nodes; brought back factor generation; implemented support for the novel BI benchmark; and optimized the runtime to generate SF30K on 20 i3.4xlarge machines on AWS.\nMoving to SparkSQL We planned to move parts of the code to SparkSQL, an optimized runtime framework for tabular data. We hypothesized that this would benefit us on multiple fronts: SparkSQL offers an efficient batch analytics runtime, with higher level abstractions that are simpler to understand and work with, and we could easily add support for serializing to Parquet based on SparkSQL\u0026rsquo;s capabilites.\nSpark SQL is a Spark module for structured data processing. It provides a programming abstraction called DataFrames and can also act as a distributed SQL query engine. 
Spark SQL includes a cost-based optimizer, columnar storage, and code generation to make queries fast.\nDealing with the dataset generator proved quite tricky, because it samples from various hand-written distributions and dictionaries, and contains complex domain logic, for which SparkSQL is unsuitable. We assessed that the best thing we could do was to wrap entire entity generation procedures in UDFs (user-defined SQL functions). However, several of these generators return entity trees1, which are spread across multiple tables by the serializer, and these would have needed to be split up. Further complicating matters, we would have also had to find a way to coordinate the inner random generators\u0026rsquo; state between the UDFs to ensure deterministic execution. Weighing these issues against the limited benefit we expected from SparkSQL, we ultimately decided to leave entity generation as it is. We limited the SparkSQL refactor to the following areas:\n(1.) table manipulations related to shaping the output into the supported layouts and data types as set forth in the specification; (2.) deriving the Interactive and BI datasets; and (3.) generating the factor tables, which contain analytic information, such as population per country, number of friendships between city pairs, number of messages per day, etc., used by the substitution parameter generator to ensure predictable query runtimes. We refer to points (1.) and (2.) collectively as dataset transformation, and to (3.) as factor generation. Initially, these steps had been part of the generator; extracting them as part of this refactor resulted in a cleaner, more maintainable design.\nThe diagram above shows the components on a high level. The generator outputs a dataset called IR (intermediate representation), which is immediately written to disk. Then, the IR is input to the dataset transformation and factor generation stages, which respectively generate the final dataset and the factor tables. We are aware that spitting out the IR adds considerable runtime overhead and doubles the disk requirements in the worst-case scenario; however, we found that there\u0026rsquo;s no simple way to avoid it, as the generator produces entity trees, which are incompatible with the flat, tabular, column-oriented layout of SparkSQL. On the positive side, this design enables us to reuse the generator output for multiple transformations and add new factor tables without regenerating the data.\nI\u0026rsquo;ll skip describing the social network graph dataset generator (i.e. stage 1) in any more detail, apart from its serializer, as that was the only part involved in the current refactor.
If you are interested in more details, you may look up the previous blogpost in the series or the Interactive benchmark specification.\nTransformation pipeline The dataset transformation stage sets off where generation finished, and applies an array of pluggable transformations:\nexplodes edges and / or attributes into separate tables, subsets the snapshot part and creates insert / delete batches for the BI workload, subsets the snapshot part for the Interactive workload, applies formatting related options such as date time representation, serializes the data to a Spark supported format (CSV, Parquet), We utilize a flexible data pipeline that operates on the graph.\ntrait Transform[M1 \u0026lt;: Mode, M2 \u0026lt;: Mode] extends (Graph[M1] =\u0026gt; Graph[M2]) { type In = Graph[M1] type Out = Graph[M2] def transform(input: In): Out override def apply(v: Graph[M1]): Graph[M2] = transform(v) } The Transform trait encodes a pure (side effect-free) function polymorphic over graphs, so that transformation pipelines can be expressed with ordinary function composition in a type safe manner. Let\u0026rsquo;s see some of the transformations we have.\ncase class RawToBiTransform(mode: BI, simulationStart: Long, simulationEnd: Long, keepImplicitDeletes: Boolean) extends Transform[Mode.Raw.type, Mode.BI] { override def transform(input: In): Out = ??? } case class RawToInteractiveTransform(mode: Mode.Interactive, simulationStart: Long, simulationEnd: Long) extends Transform[Mode.Raw.type, Mode.Interactive] { override def transform(input: In): Out = ??? } object ExplodeEdges extends Transform[Mode.Raw.type, Mode.Raw.type] { override def transform(input: In): Out = ??? } object ExplodeAttrs extends Transform[Mode.Raw.type, Mode.Raw.type] { override def transform(input: In): Out = ??? } Therefore, a transformation pipeline may look like this:\nval transform = ExplodeAttrs .andThen(ExplodeEdges) .andThen(RawToInteractiveTransform(params, start, end)) val outputGraph = transform(inputGraph) The Graph record has a definition field containing graph-global metadata, whereas entities holds the datasets keyed by their entity type. There are 3 graph modes currently: Raw, Interactive and BI. The BI dataset has different layout than the rest, as it contains incremental inserts and deletes for the entities additionally to the bulk snapshot. This is captured in the Layout dependent type, over which the entities are polymorphic.\nIt\u0026rsquo;s important to understand that Graph holds DataFrames, and these are lazily computed by Spark. So, Graph is merely a description of transformations used to derive the comprising datasets, which makes them subject to all the SparkSQL fanciness such as query optimization, whole stage code generation, and so on. Processing is delayed until an action (such as a disk write) forces it.\ncase class GraphDef[+M \u0026lt;: Mode]( isAttrExploded: Boolean, isEdgesExploded: Boolean, useTimestamp: Boolean, mode: M, entities: Map[EntityType, Option[String]] ) case class Graph[+M \u0026lt;: Mode]( definition: GraphDef[M], entities: Map[EntityType, M#Layout] ) sealed trait Mode { type Layout /* ... */ } object Mode { final case object Raw extends Mode { type Layout = DataFrame /* ... */ } final case class Interactive(bulkLoadPortion: Double) extends Mode { type Layout = DataFrame /* ... */ } final case class BI(bulkloadPortion: Double, batchPeriod: String) extends Mode { type Layout = BatchedEntity /* ... */ } } You may notice that Transform is statically typed w.r.t. 
Mode, however other properties, like isAttrExploded, or isEdgesExploded are not captured in the type, and remain merely dynamic. This makes some nonsensical transformation pipelines (i.e. that explodes edges twice in a row) syntactically valid. This trade-off in compile-time safety was made to prevent overcomplicating the types.\nAs we already mentioned, Graph is essentially a persistent container of EntityType -\u0026gt; DataFrame mappings. EntityType can be Node, Edge and Attr, and is used to identify the entity and embellish with static metadata, such a descriptive name and primary key, whether it is static or dynamic (as per the specification), and in case of edges, the source and destination type and cardinality. This makes it very simple to create transformation rules on static entity properties with pattern matching.\nUsually, a graph transformation involves matching entities based on their EntityType, and modifying the mapping (and if required, other metadata). Take, for example, the ExplodeAttrs transformation, which explodes into separate tables the values of two columns of Person stored as arrays:\nobject ExplodeAttrs extends Transform[Mode.Raw.type, Mode.Raw.type] { override def transform(input: In): Out = { if (input.definition.isAttrExploded) { // assert at runtime that the transformation hasn\u0026#39;t been applied yet throw new AssertionError(\u0026#34;Attributes already exploded in the input graph\u0026#34;) } def explodedAttr(attr: Attr, node: DataFrame, column: Column) = attr -\u0026gt; node.select(withRawColumns(attr, $\u0026#34;id\u0026#34;.as(s\u0026#34;${attr.parent}Id\u0026#34;), explode(split(column, \u0026#34;;\u0026#34;)).as(s\u0026#34;${attr.attribute}Id\u0026#34;))) val modifiedEntities = input.entities .collect { case (k @ Node(\u0026#34;Person\u0026#34;, false), df) =\u0026gt; // match the Person node. 
This is the only one ExplodeAttrs should modify Map( explodedAttr(Attr(\u0026#34;Email\u0026#34;, k, \u0026#34;EmailAddress\u0026#34;), df, $\u0026#34;email\u0026#34;), // add a new \u0026#34;PersonEmailEmailAddress\u0026#34; entity derived by exploding the email column of Person explodedAttr(Attr(\u0026#34;Speaks\u0026#34;, k, \u0026#34;Language\u0026#34;), df, $\u0026#34;language\u0026#34;), // add a new \u0026#34;PersonSpeaksLanguage\u0026#34; entity derived by exploding the language column of Person k -\u0026gt; df.drop(\u0026#34;email\u0026#34;, \u0026#34;language\u0026#34;) // drop the exploded columns from person ) } val updatedEntities = modifiedEntities .foldLeft(input.entities)(_ ++ _) // merge-replace the modified entities in the graph val updatedEntityDefinitions = modifiedEntities .foldLeft(input.definition.entities) { (e, v) =\u0026gt; e ++ v.map{ case (k, v) =\u0026gt; k -\u0026gt; Some(v.schema.toDDL) } // update the entity definition schema to reflect the modifications } val l = lens[In] // lenses provide a terse syntax for modifying nested fields (l.definition.isAttrExploded ~ l.definition.entities ~ l.entities).set(input)((true, updatedEntityDefinitions, updatedEntities)) } Note that EntityType does not hold the dataset\u0026rsquo;s full SQL schema currently, as it\u0026rsquo;s not useful for pattern matching, but can be accessed directly from DataFrame if needed.\nInput/output The Reader and Writer typeclasses are used to read from a Source and write to a Sink respectively, terminating a graph transformation pipeline\non both ends.\ntrait Reader[T] { type Ret def read(self: T): Ret def exists(self: T): Boolean } trait Writer[S] { type Data def write(self: Data, sink: S): Unit } There are implementations under ldbc.datagen.io.instances that read a graph from a GraphSource and write to a GraphSink.\nimport ldbc.snb.datagen.model import ldbc.snb.datagen.model.Mode import ldbc.snb.datagen.io.graphs.{GraphSource, GraphSink} import ldbc.snb.datagen.io.instances._ // read val inputPath = \u0026#34;path/to/input/graph\u0026#34; val inputFormat = \u0026#34;parquet\u0026#34; val source = GraphSource(model.graphs.Raw.graphDef, inputPath, inputFormat) val graph = Reader[GraphSource, Graph[Mode.Raw.type]].read(source) // transform val transform = ExplodeAttrs.andThen(ExplodeEdges) val transformedGraph = transform(graph) // write val outputPath = \u0026#34;path/to/output/graph\u0026#34; val outputFormat = \u0026#34;csv\u0026#34; val sink = GraphSink(outputPath, outputFormat) Writer[GraphSink, Graph[Mode.Raw.type]].write(transformedGraph, sink) We provide Ops syntax to make it shorter:\nimport ldbc.snb.datagen.model import ldbc.snb.datagen.model.Mode import ldbc.snb.datagen.io.graphs.{GraphSource, GraphSink} import ldbc.snb.datagen.io.instances._ import ldbc.snb.datagen.io.Reader.ops._ import ldbc.snb.datagen.io.Writer.ops._ // read val inputPath = \u0026#34;path/to/input/graph\u0026#34; val inputFormat = \u0026#34;parquet\u0026#34; val graph = GraphSource(model.graphs.Raw.graphDef, inputPath, inputFormat).read // transform val transformedGraph = ??? /* ... */ // write val outputPath = \u0026#34;path/to/output/graph\u0026#34; val outputFormat = \u0026#34;csv\u0026#34; transformedGraph.write(GraphSink(outputPath, outputFormat)) The reader/writer architecture is layered, the graph reader/writer uses dataframe readers/writers for each of its entities. One interesting aspect of implementing the reader was dealing with the input schema. 
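To sketch the lower layer (this is illustrative rather than the actual Datagen code; the names are made up), a dataframe-level source and its Reader instance might look as follows, with an optional explicit schema for formats that cannot describe themselves:
import org.apache.hadoop.fs.Path
import org.apache.spark.sql.{DataFrame, SparkSession}
import org.apache.spark.sql.types.StructType
// Hypothetical descriptor for a single entity's files on disk.
case class DataFrameSource(path: String, format: String, schema: Option[StructType] = None)
// A Reader instance for it, following the typeclass shown above.
object DataFrameSourceReader extends Reader[DataFrameSource] {
  type Ret = DataFrame
  private def spark = SparkSession.active
  override def read(self: DataFrameSource): DataFrame = {
    val reader = spark.read.format(self.format)
    // Parquet carries its own schema; CSV needs the expected schema up front.
    self.schema.fold(reader)(s => reader.schema(s)).load(self.path)
  }
  override def exists(self: DataFrameSource): Boolean = {
    val p = new Path(self.path)
    p.getFileSystem(spark.sparkContext.hadoopConfiguration).exists(p)
  }
}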
Parquet is self-describing, however as we also support the CSV format, we had to provide a way for correct schema detection and column parsing.\nSpark has a facility to derive SparkSQL schema from case classes automatically2. We created case classes for each entity in the Raw dataset. We also created a typeclass EntityTraits associating these classes with their EntityType, so we can summon them (and consequently their SparkSQL schema) in the reader.\nThe case classes are used during the serialization of the generated dataset too, but more about that later.\nFactor generation As we already mentioned, factor generation was originally part of the data generator, i.e. factor tables were calculated on the fly and emitted as side outputs. This design had some problems. Auxiliary data structures had to be maintained and interleaved with generation, which violated separation of concerns, consequently hurting readability and maintainability. Also, anything more complicated than entity local aggregates where impossible to express in the original MapReduce framework. To keep the preceding Spark rewrite at a managable scope, the original factor generation code had been removed.\nWe decided it\u0026rsquo;s best to reintroduce factor generation as a post-processing step that operates on the generated data. This makes it possible to express more complex analytical queries, requires no prior knowledge about the generator, can be done in SparkSQL (making it much simpler), and removes the impact on the generator\u0026rsquo;s performance, so that we can optimize them separately. Since this refactor, we almost tripled the number factor tables (up to 31 to cover both SNB workloads, BI and Interactive). The queries computing of certain factor tables even use GraphX, which was unimaginable with the previous design.\nFactor tables are added by extending a map with a name -\u0026gt; Factor pair. Factor declares is input entities, and accepts a function that receives input DataFrames, and returns a single DataFrame as output.\nval factors = Map ( \u0026#34;personDisjointEmployerPairs\u0026#34; -\u0026gt; Factor(PersonType, PersonKnowsPersonType, OrganisationType, PersonWorkAtCompanyType) { case Seq(person, personKnowsPerson, organisation, workAt) =\u0026gt; val knows = undirectedKnows(personKnowsPerson) val company = organisation.where($\u0026#34;Type\u0026#34; === \u0026#34;Company\u0026#34;).cache() val personSample = person .orderBy($\u0026#34;id\u0026#34;) .limit(20) personSample .as(\u0026#34;Person2\u0026#34;) .join(knows.as(\u0026#34;knows\u0026#34;), $\u0026#34;knows.person2Id\u0026#34; === $\u0026#34;Person2.id\u0026#34;) .join(workAt.as(\u0026#34;workAt\u0026#34;), $\u0026#34;workAt.PersonId\u0026#34; === $\u0026#34;knows.Person1id\u0026#34;) .join(company.as(\u0026#34;Company\u0026#34;), $\u0026#34;Company.id\u0026#34; === $\u0026#34;workAt.CompanyId\u0026#34;) .select( $\u0026#34;Person2.id\u0026#34;.alias(\u0026#34;person2id\u0026#34;), $\u0026#34;Company.name\u0026#34;.alias(\u0026#34;companyName\u0026#34;), $\u0026#34;Company.id\u0026#34;.alias(\u0026#34;companyId\u0026#34;), $\u0026#34;Person2.creationDate\u0026#34;.alias(\u0026#34;person2creationDate\u0026#34;), $\u0026#34;Person2.deletionDate\u0026#34;.alias(\u0026#34;person2deletionDate\u0026#34;) ) .distinct() }, /* more factors */ ) As you can see, it\u0026rsquo;s not much complicated than using plain SQL, with the added benefit of being able to extract recurring subqueries to functions (e.g. undirectedKnows). 
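For contrast, a simple aggregate-style factor, e.g. the number of messages per day mentioned earlier, could look roughly like this (a sketch only; the entity type and column names are assumed):
"messageCountPerDay" -> Factor(MessageType) { case Seq(message) =>
  message
    .groupBy(to_date($"creationDate").as("creationDay")) // truncate the timestamp to a calendar day
    .agg(count($"id").as("messageCount"))
}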
Currently, there\u0026rsquo;s no parallelization between different factor tables (although each of them is parallelized internally by Spark). The Factor table writer uses the same componentized architecture as the graph writer, i.e. it uses the dataframe writer under the hood.\nRevamping the data generator\u0026rsquo;s serializer At this point, both the transformation pipeline and factor generator was ready, however the data generator was still chugging with the old serializer, emitting the IR in CSV. We wanted to move this to Parquet to improve performance and reduce its size, but there was a problem: due to the generator\u0026rsquo;s custom data representation, SparkSQL (and its DataSource API) was off-limits. So we\u0026rsquo;ve bitten the bullet, and rewritten the existing serializer to emit Parquet.\nParquet is an open source data format that evolved to be the de facto standard for Big Data batch pipelines. It offers a column-oriented, compressed, schemaful representation that is space-efficient and suited for analytic queries. The file format leverages a record shredding and assembly model, which originated at Google. This results in a file that is optimized for query performance and minimizing I/O.\nThe new serialization framework is heavily influenced by the design of Java OutputStreams, in the sense that stateful objects are composed to form a pipeline. For example, in case of activities, the input is an activity tree, and the output is a set of rows in multiple files (eg. forum, forumHasTag, post, postHasTag, etc.). The components that take part in activity serialization are shown on the diagram below. The activity tree is iterated (1st component) and the corresponding entity serializer is called (2nd component), which is fed into a component that splits the records (3rd one) among several output streams writing individual files (last).\nThe benefit of this architecture is that only the last component needs to change when we add support for a new output format.\nTo support Parquet, we made use of row-level serializers available in Hadoop\u0026rsquo;s Parquet library (bundled with SparkSQL), and internal classes in SparkSQL to derive Parquet schema for our entities. Remember how we used case classes for the Raw entities to derive the input schema in the graph reader during dataset transformation? Here we use the same classes (e.g. Forum) and Spark\u0026rsquo;s Encoder framework to encode the entities in Parquet, which means that the generated output remains consistent with DataFrame-based reader, and we spare a lot of code duplication.\nOptimizations After these refactors, we were able to generate the BI dataset with scale factor 10K on 300 i3.4xlarge machines in one hour. Decreasing the number of machines resulted in out of memory errors in the generator. We realized partition sizes (and thus the number of partitions) should be determined based on available memory. Our experiments showed that a machine with 128GB of memory is capable of generating SF3K (scale factor 3000) reliably with 3 blocks3 per partition given ample disk size to allow for spills (tested with 3.8TB); while less partitions (subsequently, larger block/partition ratio) would introduce OOM errors. Furthermore, we split the data generator output after a certain number of rows written, to fend against the skew between different kinds of entities possibly causing problems during transformation4. 
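The partition sizing itself boils down to a one-line calculation; below is a hypothetical helper mirroring the formula used for the configurations that follow (assuming the 10,000-person block size from the footnote and 3 blocks per partition):
// Sketch of the partition-count formula: partitions = ceil(number_of_persons / block_size / blocks_per_partition)
def numPartitions(numPersons: Long, blockSize: Long = 10000L, blocksPerPartition: Int = 3): Int =
  math.ceil(numPersons.toDouble / blockSize / blocksPerPartition).toInt
// For example, the 1000 partitions used for the SF10K run below correspond to roughly 30 million persons.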
These optimizations enabled us to run SF10K reliably on 4 i3.4xlarge machines in 11 hours (which is still a more than 6x reduction in cost). We weren\u0026rsquo;t able to run SF30K on 10 machines (1 machine / SF3K); even 15 machines ran out of disk. This non-linear disk use should be investigated further as it complicates calculating cluster sizes for larger scale factors.\n./tools/emr/submit_datagen_job.py sf3k_bi 3000 parquet bi \\ --sf-per-executor 3000 \\ --partitions 330 \\ --jar $JAR_NAME \\ --instance-type i3.4xlarge \\ --bucket $BUCKET_NAME \\ -- --explode-edges --explode-attrs ./tools/emr/submit_datagen_job.py sf10k_bi 10000 parquet bi \\ --sf-per-executor 3000 \\ --partitions 1000 \\ --jar $JAR_NAME \\ --instance-type i3.4xlarge \\ --bucket $BUCKET_NAME \\ -- --explode-edges --explode-attrs The above examples are working configurations for generating the 3K and 10K BI datasets. The --sf-per-executor option controls the number of worker nodes allocated, in this case 1 node for every 3000 SF, i.e. 1 and 4 nodes, respectively. The --partitions option controls the total number of partitions, and was calculated based on the number of persons using the formula partitions = ceil(number_of_persons / block_size / 3) to get a maximum of 3 blocks per partition.\nConclusion These improvements made LDBC SNB Datagen more modular, maintainable and efficient, costing under a cent per scale factor to generate the BI dataset, which enables us to generate datasets beyond SF 100K.\nFootnotes The generator produces hierarchies, such as a forum wall with a random number of posts, which have comments, etc. This tree is iterated, and different entities are written to separate files.\u0026#160;\u0026#x21a9;\u0026#xfe0e;\nShameless plug: You can learn more about this from another blogpost of mine.\u0026#160;\u0026#x21a9;\u0026#xfe0e;\nThe data generator produces blocks of 10,000 persons and their related entities. Entities from different blocks are unrelated (isolated).\u0026#160;\u0026#x21a9;\u0026#xfe0e;\nThe maximum row count per file is currently 10M; however, this can be modified with a command line option. We also had an alternative design in mind where this number would have been determined based on the average row size of each entity; however, we stayed with the first version for simplicity.\u0026#160;\u0026#x21a9;\u0026#xfe0e;\n","permalink":"https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/","tags":["datagen","snb"],"title":"LDBC SNB Datagen – The winding path to SF100K"},{"categories":null,"contents":"Organizers: Gábor Szárnyas, Jack Waudby, Peter Boncz, Alastair Green\nLDBC is hosting a two-day hybrid workshop, co-located with SIGMOD 2022 on June 17-18 (Friday-Saturday).\nThe program consists of 10-15 minute talks followed by a Q\u0026amp;A session. The talks will be recorded and made available online.\nThe tentative program is the following.
All times are in EDT.\nWe will have a social event on Friday at 17:30 at El Vez (Google Maps).\nFriday (Pennsylvania Convention Center, room 204B) start finish speaker title 09:20 09:30 Peter Boncz (LDBC/CWI) State of the union – slides, video 09:30 09:45 Alastair Green (LDBC/Birkbeck) LDBC\u0026rsquo;s fair use policies – slides, video 09:50 10:05 Gábor Szárnyas (LDBC/CWI), Jack Waudby (Newcastle University) LDBC Social Network Benchmark: Business Intelligence workload v1.0 – slides, video 10:10 10:25 Heng Lin (Ant Group) LDBC Financial Benchmark introduction – slides, video 10:30 11:00 coffee break 11:00 11:15 Chen Zhang (CreateLink) New LDBC SNB benchmark record by Galaxybase: More than 6 times faster and 70% higher throughput – slides, video 11:20 11:35 James Clarkson (Neo4j) LDBC benchmarks: Promoting good science and industrial consumption – slides, video 11:40 11:55 Oskar van Rest (Oracle) Creating and querying property graphs in Oracle, on-premise and in the cloud – slides, video 12:00 12:15 Mingxi Wu (TigerGraph) Conquering LDBC SNB BI at SF-10k – slides, video 12:20 13:20 lunch (on your own) 13:20 13:35 Altan Birler (Technische Universität München) Relational databases can handle graphs too! Experiences with optimizing the Umbra RDBMS for LDBC SNB BI – slides, video 13:40 13:55 David Püroja (CWI) LDBC Social Network Benchmark: Interactive workload v2.0 – slides 14:00 14:15 Angela Bonifati (Lyon 1 University) The quest for schemas in graph databases – slides, video 14:20 14:35 Matteo Lissandrini (Aalborg University) Understanding graph data representations in triplestores – slides, video 14:40 14:55 Wim Martens (University of Bayreuth) Path representations – slides, video 15:00 15:20 Audrey Cheng\t(UC Berkeley) TAOBench: An end-to-end benchmark for social network workloads – slides, video Saturday (Philadelphia Marriott Downtown, room 401-402, 4th floor) start finish speaker title 10:00 10:15 Keith Hare (WG3) An update on the GQL \u0026amp; SQL/PGQ standards efforts – slides, video 10:20 10:35 Leonid Libkin (ENS Paris) Pattern matching in GQL and SQL/PGQ – slides, video 10:40 10:55 Petra Selmer (Neo4j/WG3) An overview of GQL – slides, video 11:00 11:15 Alastair Green (LDBC/WG3) GQL 2.0: A technical manifesto – slides, video 11:20 11:35 George Fletcher (TU Eindhoven) PG-Keys (LDBC Property Graph Schema Working Group) – slides, video 11:40 11:55 Arvind Shyamsundar (Microsoft) Graph capabilities in Microsoft SQL Server and Azure SQL Database – slides, video 12:00 13:30 lunch (on your own) 13:30 13:45 Daniël ten Wolde (CWI) Implementing SQL/PGQ in DuckDB – slides, video 13:50 14:05 Oszkár Semeráth, Kristóf Marussy (TU Budapest) Generation techniques for consistent, realistic, diverse, and scalable graphs – slides, video 14:10 14:25 Molham Aref (RelationalAI) Graph Normal Form – slides, video 14:30 14:45 Naomi Arnold (Queen Mary University of London) Temporal graph analysis of the far-right social network Gab – slides, video 14:50 15:05 Domagoj Vrgoč (PUC Chile) Evaluating path queries in MillenniumDB – slides, video 15:10 15:25 Pavel Klinov, Evren Sirin (Stardog) Stardog\u0026rsquo;s experience with LDBC – slides, video ","permalink":"https://ldbcouncil.org/event/fifteenth-tuc-meeting/","tags":["TUC Meeting"],"title":"Fifteenth TUC Meeting"},{"categories":null,"contents":"We are delighted to announce the set up of the Financial Benchmark (FinBench) task force.\nThe Financial Benchmark (FinBench) project aims to define a graph database evaluating benchmark and develop a data generation 
process and a query driver to make the evaluation of the graph database representative, reliable and comparable, especially in financial scenarios, such as anti-fraud and risk control. The FinBench is scheduled to be released in the end of 2022.\nCompared to LDBC SNB, the FinBench will differ in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. FinBench is going to redesign the data pattern and workloads, including the data generation, the query driver, and also some other facilities referred to LDBC SNB.\nThe FinBench Task Force was approved by LDBC on May 16, 2022. The FinBench Task Force is led by Ant Group, and the initial members also include Pometry, Create Link, StarGraph, Ultipa, Katana, Intel, Memgraph (observer) and Koji Annoura (individual member). See the Work Charter for FinBench\nIf you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or guozhihui.gzh at antgroup.com.\n","permalink":"https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/","tags":["finbench"],"title":"Announcing the LDBC Financial Benchmark Task Force"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalspvldb-szarnyas-wssbwzb-22/","tags":[],"title":"The LDBC Social Network Benchmark: Business Intelligence Workload"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalspvldb-bonifati-dfhhmms-22/","tags":[],"title":"Threshold Queries in Theory and in the Wild"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/fin-bench-work-charter/","tags":[],"title":"Work Charter for FinBench v1.0"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-tr-tr-2021-01/","tags":[],"title":"Property graphs and paths in GQL: Mathematical definitions"},{"categories":null,"contents":"LDBC was hosting a one-day hybrid workshop, co-located with VLDB 2021 on August 16 (Monday) between 16:00–20:00 CEST.\nThe physical part of the workshop was held in room Akvariet 2 of the Tivoli Hotel (Copenhagen), while the virtual part was hosted on Zoom. Our programme consisted of talks that provide an overview of LDBC\u0026rsquo;s recent efforts. Moreover, we have invited industry practitioners and academic researchers to present their latest results.\nTalks were scheduled to be 10 minutes with a short Q\u0026amp;A session. We had three sessions. 
Their schedules are shown below.\n[16:00–17:25 CEST] LDBC updates, benchmarks, query languages start speaker title 16:00 Peter Boncz (CWI) State of the union – slides 16:05 Gábor Szárnyas (CWI) Overview of LDBC benchmarks – slides 16:12 Mingxi Wu (TigerGraph) LDBC Social Network Benchmark results with TigerGraph – slides 16:24 Xiaowei Zhu (Ant Group) Financial Benchmark proposal – slides 16:36 Petra Selmer (Neo4j) Status report from the Existing Languages Working Group (ELWG) – slides, video 16:48 Jan Hidders (Birkbeck) Status report from the Property Graph Schema Working Group (PGSWG) – slides, video 17:00 Keith Hare (JCC Consulting) Database Language Standards Structure and Process, SQL/PGQ – slides, video 17:12 Stefan Plantikow (GQL Editor) Report on the GQL standard – slides, video coffee break (10 minutes)\n[17:35–18:45 CEST] Systems and data structures start speaker title 17:35 Vasileios Trigonakis (Oracle Labs) PGX.D aDFS: An Almost Depth-First-Search Distributed Graph-Querying System – slides, video 17:47 Matthias Hauck (SAP) JSON, Spatial, Graph – Multi-model Workloads with SAP HANA Cloud – slides, video 17:59 Nikolay Yakovets (Eindhoven University of Technology) AvantGraph – slides, video 18:11 Semih Salihoglu (University of Waterloo) GRainDB: Making RDBMSs Efficient on Graph Workloads Through Predefined Joins – slides, video 18:23 Semyon Grigorev (Saint Petersburg University) Context-free path querying: Obstacles on the way to adoption – slides, video 18:35 Per Fuchs (Technical University of Munich) Sortledton: A universal, transactional graph data structure – slides, video coffee break (10 minutes)\n[18:55-20:00 CEST] High-level approaches and benchmarks start speaker title 18:55 Angelos-Christos Anadiotis (Ecole Polytechnique and Institut Polytechnique de Paris) Empowering Investigative Journalism with Graph-based Heterogeneous Data Management – slides, video 19:07 Vasia Kalavri (Boston University) Learning to partition unbounded graph streams – slides, video 19:19 Muhammad Attahir Jibril (TU Ilmenau) Towards a Hybrid OLTP-OLAP Graph Benchmark – slides, video 19:31 Riccardo Tommasini (University of Tartu) An outlook on Benchmarks for Graph Stream Processing – slides, video 19:43 Mohamed Ragab (University of Tartu) Benchranking: Towards prescriptive analysis of big graph processing: the case of SparkSQL – slides, video ","permalink":"https://ldbcouncil.org/event/fourteenth-tuc-meeting/","tags":["TUC Meeting"],"title":"Fourteenth TUC Meeting"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalscorrabs-2112-06217/","tags":[],"title":"Graph Pattern Matching in GQL and SQL/PGQ"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-angles-bdfhhlllm-21/","tags":[],"title":"PG-Keys: Keys for Property Graphs"},{"categories":null,"contents":"LDBC is pleased to announce its Thirteenth Technical User Community (TUC) meeting.\nLDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.\nThis TUC meeting will be a two-day event hosted online. We welcome all users of RDF and Graph technologies to attend. 
If you are interested to attend the event, please, contact Gabor Szarnyas (BME) to register.\nSNB Task Force Progress report ACID compliance test suite Integrating deletions to Datagen Migrating Datagen to Spark Redesign of BI read queries Extensions to the driver Ongoing work Datagen: tuning the distribution of deletes Interactive 2.0 workload BI 1.0 workload Zoom links will be sent through email.\n","permalink":"https://ldbcouncil.org/event/thirteenth-tuc-meeting/","tags":["TUC Meeting"],"title":"Thirteenth TUC Meeting"},{"categories":null,"contents":"LDBC\u0026rsquo;s Social Network Benchmark [4] (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework where different graph-based technologies can be fairly tested and compared, that can drive the identification of systems\u0026rsquo; bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data management.\nLDBC SNB provides Datagen (Data Generator), which produces synthetic datasets, mimicking a social network\u0026rsquo;s activity during a period of time. Datagen is defined by the charasteristics of realism, scalability, determinism and usability. To address scalability in particular, Datagen has been implemented on the MapReduce computation model to enable scaling out across a distributed cluster. However, since its inception in the early 2010s there has been a tremendous amount of development in the big data landscape, both in the sophistication of distributed processing platforms, as well as public cloud IaaS offerings. In the light of this, we should reevaluate this implementation, and in particular, investigate if Apache Spark would be a more cost-effective solution for generating datasets on the scale of tens of terabytes, on public clouds such as Amazon Web Services (AWS).\nOverview The benchmark\u0026rsquo;s specification describes a social network data model which divides its components into two broad categories: static and dynamic. The dynamic element consists of an evolving network where people make friends, post in forums, comment or like each others posts, etc. In contrast, the static component contains related attributes such as countries, universities and organizations and are fixed values. For the detailed specifications of the benchmark and the Datagen component, see References.\nDatasets are generated in a multi-stage process captured as a sequence of MapReduce steps (shown in the diagram below).\n\\ Figure 1. LDBC SNB Datagen Process on Hadoop\nIn the initialization phase dictionaries are populated and distributions are initialized. In the first generation phase persons are synthesized, then relationships are wired between them along 3 dimensions (university, interest and random). After merging the graph of person relationships, the resulting dataset is output. Following this, activities such as forum posts, comments, likes and photos are generated and output. Finally, the static components are output.\nNote: The diagram shows the call sequence as implemented. All steps are sequential \u0026ndash; including the relationship generation \u0026ndash;, even in cases when the data dependencies would allow for parallelization.\nEntities are generated by procedural Java code and are represented as POJOs in memory and as sequence files on disk. 
Most entities follow a shallow representation, i.e foreign keys (in relational terms) are mapped to integer ids, which makes serialization straightforward.1 A notable exception is the Knows edge which contains only the target vertex, and is used as a navigation property on the source Person. The target Person is replaced with only the foreign key augmented with some additional information in order to keep the structure free of cycles. Needless to say, this edge as property representation makes the data harder to handle in SQL than it would be with a flat join table.\nEntity generation amounts to roughly one fifth of the main codebase. It generates properties drawn from several random distributions using mutable pRNGs. Determinism is achieved by initializing the pRNGs to seeds that are fully defined by the configuration with constants, and otherwise having no external state in the logic.2\nSerialization is done by hand-written serializers for the supported output formats (e.g. CSV) and comprises just a bit less than one third of the main codebase. Most of the output is created by directly interacting with low-level HDFS file streams. Ideally, this code should be migrated to higher-level writers that handle faults and give consistent results when the task has to be restarted.\nMotivations for the migration The application is written using Hadoop MapReduce, which is now largely superseded by more modern distributed batch processing platforms, notably Apache Spark. For this reason, it was proposed to migrate Datagen to Spark. The migration provides the following benefits:\nBetter memory utilization: MapReduce is disk-oriented, i.e. it writes the output to disk after each reduce stage which is then read by the next MapReduce job. As public clouds provide virtual machines with sufficient RAM to encapsulate any generated dataset, time and money are wasted by the overhead this unnecessary disk I/O incurs. Instead, the intermediate results should be cached in memory where possible. The lack of support for this is a well-known limitation of MapReduce.\nSmaller codebase: The Hadoop MapReduce library is fairly ceremonial and boilerplatey. Spark provides a higher-level abstraction that is simpler to work with, while still providing enough control on the lower-level details required for this workload.\nSmall entry cost: Spark and MapReduce are very close conceptually, they both utilise HDFS under the hood, and run on the JVM. This means that a large chunk of the existing code can be reused, and migration to Spark can, therefore, be completed with relatively small effort. Additionally, MapReduce and Spark jobs can be run on AWS EMR using basically the same HW/SW configuration, which facilitates straightforward performance comparisons.\nIncremental improvements: Spark exposes multiple APIs for different workloads and operating on different levels of abstraction. Datagen may initially utilise the lower-level, Java-oriented RDDs (which offer the clearest 1 to 1 mapping when coming from MapReduce) and gradually move towards DataFrames to support Parquet output in the serializers and maybe unlock some SQL optimization capabilities in the generators later down the road.\nOSS, commodity: Spark is one of the most widely used open-source big data platforms. Every major public cloud provides a managed offering for Spark. 
Together these mean that the migration increases the approachability and portability of the code.\nFirst steps The first milestone is a successful run of LDBC Datagen on Spark while making the minimum necessary amount of code alterations. This entails the migration of the Hadoop wrappers around the generators and serializers. The following bullet-points summarize the key notions that cropped up during the process.\nUse your memory: A strong focus was placed on keeping the call sequence intact, so that the migrated code evaluates the same steps in the same order, but with data passed as RDDs. It was hypothesised that the required data could be either cached in memory entirely at all times, or if not, regenerating them would still be faster than involving the disk I/O loop (e.g. by using MEMORY_AND_DISK). In short, the default caching strategy was used everywhere.\nRegression tests: Lacking tests apart from an id uniqueness check, meant there were no means to detect bugs introduced by the migration. Designing and implementing a comprehensive test suite was out of scope, so instead, regression testing was utilised, with the MapReduce output as the baseline. The original output mostly consists of Hadoop sequence files which can be read into Spark, allowing comparisons to be drawn with the output from the RDD produced by the migrated code.\nThread-safety concerns: Soon after migrating the first generator and running the regression tests, there were clear discrepancies in the output. These only surfaced when the parallelization level was set greater than 1. This indicated the presence of potential race conditions. Thread-safety wasn\u0026rsquo;t a concern in the original implementation due to the fact that MapReduce doesn\u0026rsquo;t use thread-based parallelization for mappers and reducers.3 In Spark however, tasks are executed by parallel threads in the same JVM application, so the code is required to be thread-safe. After some debugging, a bug was discovered originating from the shared use of java.text.SimpleDateFormat (notoriously known to be not thread-safe) in the serializers. This was resolved simply by changing to java.time.format.DateTimeFormatter. There were multiple instances of some static field on an object being mutated concurrently. In some cases this was a temporary buffer and was easily resolved by making it an instance variable. In another case a shared context variable was used, which was resolved by passing dedicated instances as function arguments. Sadly, the Java language has the same syntax for accessing locals, fields and statics, 4 which makes it somewhat harder to find potential unguarded shared variables.\nCase study: Person ranking Migrating was rather straightforward, however, the so-called person ranking step required some thought. The goal of this step is to organize persons so that similar ones appear close to each other in a deterministic order. This provides a scalable way to cluster persons according to a similarity metric, as introduced in the S3G2 paper [3].\nThe original MapReduce version \\ Figure 2. Diagram of the MapReduce code for ranking persons\nThe implementation, shown in pseudocode above, works as follows:\nThe equivalence keys are mapped to each person and fed into TotalOrderPartitioner which maintains an order sensitive partitioning while trying to emit more or less equal sized groups to keep the data skew low. 
The reducer keys the partitions with its own task id and a counter variable which has been initialized to zero and incremented on each person, establishing a local ranking inside the group. The final state of the counter (which is the total number of persons in that group) is saved to a separate \u0026ldquo;side-channel\u0026rdquo; file upon the completion of a reduce task. In a consecutive reduce-only stage, the global order is established by reading all of these previously emitted count files in the order of their partition number in each reducer, then creating an ordered map from each partition number to the corresponding cumulative count of persons found in all preceding ones. This is done in the setup phase. In the reduce function, the respective count is incremented and assigned to each person. Once this ranking is done, the whole range is sliced up into equally sized blocks, which are processed independently. For example, when wiring relationships between persons, only those appearing in the same block are considered.\nThe migrated version Spark provides a sortBy function which takes care of the first step above in a single line. The gist of the problem remains collecting the partition sizes and making them available in a later step. While the MapReduce version uses a side output, in Spark the partition sizes are collected in a separate job and passed into the next phase using a broadcast variable. The resulting code size is a fraction of the original one.\nBenchmarks Benchmarks were carried out on AWS EMR, originally utilising i3.xlarge instances because of their fast NVMe SSD storage and ample amount of RAM.\nThe application parameter hadoop.numThreads controls the number of reduce threads in each Hadoop job for the MapReduce version and the number of partitions in the serialization jobs in the Spark one. For MapReduce, this was set to n_nodes, i.e. the number of machines; experimentation yield slowdowns for higher values. The Spark version on the other hand, performed better with this parameter set to n_nodes * v_cpu. The scale factor (SF) parameter determines the output size. It is defined so that one SF unit generates around 1 GB of data. That is, SF10 generates around 10 GB, SF30 around 30 GB, etc. It should be noted however, that incidentally the output was only 60% of this in these experiments, stemming from two reasons. One, update stream serialization was not migrated to Spark, due to problems in the original implementation. Of course, for the purpose of faithful comparison the corresponding code was removed from the MapReduce version as well before executing the benchmarks. This explains a 10% reduction from the expected size. The rest can be attributed to incorrectly tuned parameters.5 The MapReduce results were as follows:\nSF workers Platform Instance Type runtime (min) runtime * worker/SF (min) 10 1 MapReduce i3.xlarge 16 1.60 30 1 MapReduce i3.xlarge 34 1.13 100 3 MapReduce i3.xlarge 40 1.20 300 9 MapReduce i3.xlarge 44 1.32 It can be observed that the runtime per scale factor only increases slowly, which is good. The metric charts show an underutilized, bursty CPU. The bursts are supposedly interrupted by the disk I/O parts when the node is writing the results of a completed job. It can also be seen that the memory only starts to get consumed after 10 minutes of the run have assed.\nFigure 3. CPU Load for the Map Reduce cluster is bursty and less than\n50% on average (SF100, 2nd graph shows master)\nFigure 4. 
The job only starts to consume memory when already 10 minutes\ninto the run (SF100, 2nd graph shows master)\nLet\u0026rsquo;s see how Spark fares.\nSF workers Platform Instance Type runtime (min) runtime * worker/SF (min) 10 1 Spark i3.xlarge 10 1.00 30 1 Spark i3.xlarge 21 0.70 100 3 Spark i3.xlarge 27 0.81 300 9 Spark i3.xlarge 36 1.08 1000 30 Spark i3.xlarge 47 1.41 3000 90 Spark i3.xlarge 47 1.41 A similar trend here, however the run times are around 70% of the MapReduce version. It can be seen that the larger scale factors (SF1000 and SF3000) yielded a long runtime than expected. On the metric charts of SF100 the CPU shows full utilization, except at the end, when the results are serialized in one go and the CPU is basically idle (the snapshot of the diagram doesn\u0026rsquo;t include this part unfortunately). Spark can be seen to have used up all memory pretty fast even in case of SF100. In case of SF1000 and SF3000, the nodes are running so low on memory that most probably some of the RDDs have to be calculated multiple times (no disk level serialization was used here), which seem to be the most plausible explanation for the slowdowns experienced. In fact, the OOM errors encountered when running SF3000 supports this hypothesis even further. It was thus proposed to scale up the RAM in the instances. The CPU utilization hints that adding some extra vCPUs as well can further yield speedup.\nFigure 5. Full CPU utilization for Spark (SF100, last graph shows\nmaster)\nFigure 6. Spark eats up memory fast (SF100, 2nd graph shows master)\ni3.2xlarge would have been the most straightforward option for scaling up the instances, however the humongous 1.9 TB disk of this image is completely unnecessary for the job. Instead the cheaper r5d.2xlarge instance was utilised, largely identical to i3.2xlarge, except it only has a 300 GB SSD.\nSF workers Platform Instance Type runtime (min) runtime * worker/SF (min) 100 3 Spark r5d.2xlarge 16 0.48 300 9 Spark r5d.2xlarge 21 0.63 1000 30 Spark r5d.2xlarge 26 0.78 3000 90 Spark r5d.2xlarge 25 0.75 10000 303 Spark r5d.2xlarge 25 0.75 The last column clearly demonstrates our ability to keep the cost per scale factor unit constant.\nNext steps The next improvement is refactoring the serializers so they use Spark\u0026rsquo;s high-level writer facilities. The most compelling benefit is that it will make the jobs fault-tolerant, as Spark maintains the integrity of the output files in case the task that writes it fails. This makes Datagen more resilient and opens up the possibility to run on less reliable hardware configuration (e.g. EC2 spot nodes on AWS) for additional cost savings. They will supposedly also yield some speedup on the same cluster configuration.\nAs already mentioned, the migration of the update stream serialization was ignored due to problems with the original code. Ideally, they should be implemented with the new serializers.\nThe Spark migration also serves as an important building block for the next generation of LDBC benchmarks. As part of extending the SNB benchmark suite, the SNB task force has recently extended Datagen with support for generating delete operations [1]. The next step for the task force is to fine-tune the temporal distributions of these deletion operations to ensure that the emerging sequence of events is realistic, i.e. 
the emerging distribution resembles what a database system would experience when serving a real social network.\nAcknowledgements This work is based upon the work of Arnau Prat, Gábor Szárnyas, Ben Steer, Jack Waudby and other LDBC contributors. Thanks for your help and feedback!\nReferences [1] Supporting Dynamic Graphs and Temporal Entity Deletions in the LDBC Social Network Benchmark\u0026rsquo;s Data Generator\n[2] 9th TUC Meeting \u0026ndash; LDBC SNB Datagen Update \u0026ndash; Arnau Prat (UPC) - slides\n[3] S3G2: a Scalable Structure-correlated Social Graph Generator\n[4] The LDBC Social Network Benchmark\n[5] LDBC - LDBC GitHub organization\nAlso makes it easier to map to a tabular format thus it is a SQL friendly representation.\u0026#160;\u0026#x21a9;\u0026#xfe0e;\nIt\u0026rsquo;s hard to imagine this done declaratively in SQL.\u0026#160;\u0026#x21a9;\u0026#xfe0e;\nInstead, multiple YARN containers have to be used if you want to parallelize on the same machine.\u0026#160;\u0026#x21a9;\u0026#xfe0e;\nAlthough editors usually render these using different font styles.\u0026#160;\u0026#x21a9;\u0026#xfe0e;\nWith the addition of deletes, entities often get inserted and deleted during the simulation (which is normal in a social network). During serialization, we check for such entities and omit them. However, we forgot to calculate this when determining the output size, which we will amend when tuning the distributions.\u0026#160;\u0026#x21a9;\u0026#xfe0e;\n","permalink":"https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/","tags":["datagen","snb"],"title":"Speeding Up LDBC SNB Datagen"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-oaep-oaep-2023-04/","tags":[],"title":"LDBC Property Graph Schema contributions to WG3"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalscorrabs-2010-12243/","tags":[],"title":"An analysis of the SIGMOD 2014 Programming Contest: Complex queries on the LDBC social network graph"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-waudby-sps-20/","tags":[],"title":"Supporting Dynamic Graphs and Temporal Entity Deletions in the LDBC Social Network Benchmark's Data Generator"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalscorrabs-2011-15028/","tags":[],"title":"The LDBC Graphalytics Benchmark"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalscorrabs-2001-02299/","tags":[],"title":"The LDBC Social Network Benchmark"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-conftpctc-waudby-skmbs-20/","tags":[],"title":"Towards Testing ACID Compliance in the LDBC Social Network Benchmark"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-oaep-oaep-2023-02/","tags":[],"title":"Introduction to GQL Schema design"},{"categories":null,"contents":"LDBC is pleased to announce its Twelfth Technical User Community (TUC) meeting.\nLDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry \u0026ndash; LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.\nThis TUC meeting will be a one-day event on the last Friday of 
SIGMOD/PODS 2019 in Amsterdam, The Netherlands, in the conference venue of Beurs van Berlage. The room is the Mendes da Silva kamer. Please check its tips for accommodation in Amsterdam.\nNote also that at SIGMOD/PODS in Amsterdam on Sunday, June 30, there is a research workshop on graph data management technology called GRADES-NDA 2019, that may be of interest to our audience (this generally holds for the whole SIGMOD/PODS program, of course).\nWe welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at damaris@ac.upc.edu to register.\n=\u0026gt; registration is free, but required \u0026lt;=\nYou need to be registered in order to get into the SIGMOD/PODS venue. Friday, July 5, is the final, workshop, day of SIGMOD/PODS, and the LDBC TUC meeting joins the other workshops for coffee and lunch.\nIn the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management.\nTalk proposals can be sent to Peter Boncz, who is also the local organizer. Please also send your slides to this email for archiving on this site.\nFurther, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.\nAgenda In the TUC meeting, there will be:\nupdates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads. 
talks by data management practitioners highlighting graph data management challenges and products The morning slot (08:30-10:30) is reserved for an LDBC Board Meeting, to which in principle only LDBC directors are invited (that meeting will be held in the same room).\nThe TUC meeting will start on Friday morning after the morning coffee break of SIGMOD/PODS 2019 (room: Mendes da Silva kamer):\n08:30-10:30 LDBC Board Meeting (non-public)\n10:30-11:00 Coffee\n11:00-12:45 Session 1: Graph Benchmarks\n11:00-11:05 Welcome \u0026amp; introduction\n11:05-11:45 Gabor Szarnyas (BME), Benjamin Steer (QMUL), Jack Waudby (Newcastle University): Business Intelligence workload: Progress report and roadmap\n11:45-12:00 Frank McSherry (Materialize): Experiences implementing LDBC queries in a dataflow system\n12:00-12:25 Vasileios Trigonakis (Oracle): Evaluating a new distributed graph query engine with LDBC: Experiences and limitations\n12:25-12:45 Ahmed Musaafir (VU Amsterdam): LDBC Graphalytics\n12:45-14:00 Lunch\n14:00-16:05 Session 2: Graph Query Languages\n14:00-14:25 Juan Sequeda (Capsenta): Property Graph Schema Working Group: A progress report\n14:25-14:50 Stefan Plantikow (Neo4j): GQL: Scope and features, report\n14:50-15:15 Vasileios Trigonakis (Oracle): Property graph extensions for the SQL standard\n15:15-15:40 Alin Deutsch (TigerGraph): Modern graph analytics support in GSQL, TigerGraph\u0026rsquo;s query language\n15:40-16:05 Jan Posiadała (Nodes and Edges, Poland): Executable semantics of graph query language\n16:05-16:30 Coffee\n16:30-17:50 Session 3: Graph System Performance\n16:30-16:50 Per Fuchs (CWI): Fast, scalable WCOJ graph-pattern matching on in-memory graphs in Spark\n16:50-17:10 Semih Salihoglu (University of Waterloo): Optimizing subgraph queries with a mix of tradition and modernity pptx\n17:10-17:30 Roi Lipman (RedisGraph): Evaluating Cypher queries and procedures as algebraic operations within RedisGraph\n17:30-17:50 Alexandru Uta (VU Amsterdam): Low-latency Spark queries on updatable data\nIf there is interest, we will organize a social dinner on Friday evening for LDBC attendees.\n","permalink":"https://ldbcouncil.org/event/twelfth-tuc-meeting/","tags":["TUC Meeting"],"title":"Twelfth TUC Meeting"},{"categories":null,"contents":"LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmark development, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry \u0026ndash; LDBC counts Oracle, IBM, Intel, Neo4j and Huawei among its members.\nThis TUC meeting will be a one-day event preceding the SIGMOD/PODS 2018 conference in Houston, Texas (not too far away, the whole next week). Note also that at SIGMOD/PODS in Houston on Sunday 10, there is a research workshop on graph data management technology called GRADES-NDA 2018 as well, so you might combine travel.\nWe welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at damaris@ac.upc.edu to register.\n=\u0026gt; registration is free, but required \u0026lt;=\nIn the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. 
We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz (boncz@cwi.nl) and Larri (larri@ac.upc.edu). Local organizer is Juan Sequeda (juanfederico@gmail.com).\nFurther, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.\nAgenda In the TUC meeting there will be:\nupdates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its interactive, business analytics and graphalytics workloads. talks by data management practitioners highlighting graph data management challenges and products The meeting will start on Friday morning, with a program from 10:30-17:00:\n10:30-10:35 Peter Boncz (CWI) - introduction to the LDBC TUC meeting\n10:35-11:00 Juan Sequeda (Capsenta) - Announcing: gra.fo\n11:00-11:30 coffee break\n11:30-11:55 Gabor Szarnyas (BME) - LDBC benchmarks: three aspects of graph processing\n11:55-12:20 Peter Boncz (CWI) - G-CORE: a composable graph query language by LDBC\n12:20-12:45 Yinglong Xia (Huawei) - Graph Engine for Cloud AI\n12:45-14:00 lunch\n14:00-14:25 Stefan Plantikow (Neo4j) - Composable Graph Queries and Multiple Named Graphs in Cypher for Apache Spark\n14:25-14:50 Oskar van Rest (Oracle) - Analyzing Stack Exchange data using Property Graph in Oracle\n14:50-15:15 Brad Bebee (Amazon) - Neptune: the AWS graph management service\n15:15-15:40 coffee break\n15:40-16:05 Bryon Jacob (data.world): Broadening the Semantic Web\n16:05-16:30 Jason Plurad (IBM) - Graph Computing with JanusGraph\n16:30-16:55 Arthur Keen (Cambridge Semantics): AnzoGraph\n16:55-17:20 Molham Aref (relational.ai)) - Introducing.. relational.ai\n18:00 - 20:00 social dinner in Austin (sponsored by Intel Corp.), Coopers BBQ, 217 Congress Ave, Austin, TX 78701\nLocation The TUC will be held at the University of Texas at Austin, Department of Computer Science in the Gates Dell Complex (GDC): 2317 Speedway, Austin TX, 78712 Room: GDC 6.302\nThe GDC building has a North and a South building. GDC 6.302 is in the North building. When you enter the main entrance, the North building is on the left and it is served by a pair of elevators. You can take or the elevator to the 6th floor. Exit the elevator on the 6th floor. Turn left, right, left.\nFrom Austin to SIGMOD/PODS (Houston) on Saturday June 9 Many of the attendees will be going to SIGMOD/PODS which will be held in Houston.\nBus One option is to take a MegaBus that departs from downtown Austin and arrives at downtown Houston.\nThere is a bus that departs at 12:00PM and arrives at 3:00pm. Cost is $20 (as of April 23).\nIf you want to spend the day in Austin, there is a bus that departs at 9:55PM and arrives at 12:50am. 
Cost is $5 (as of April 23).\n","permalink":"https://ldbcouncil.org/event/eleventh-tuc-meeting/","tags":["TUC Meeting"],"title":"Eleventh TUC Meeting"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-oaep-oaep-2023-01/","tags":[],"title":"SQL/PGQ data model and graph schema"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confgrades-szarnyas-pampkeb-18/","tags":[],"title":"An early look at the LDBC Social Network Benchmark's Business Intelligence workload"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-angles-abbfglpps-18/","tags":[],"title":"G-CORE: A Core for Future Graph Query Languages"},{"categories":null,"contents":"This will be a one-day event at the VLDB 2017 conference in Munich, Germany on September 1, 2017.\nTopics and activities of interest in these TUC meetings are:\nPresentation on graph data management usage scenarios. Presentation of the benchmarking results for the different benchmarks, as well as the graph query language task force. Interaction with the new LDBC Board of Directors and the LDBC organisation officials. We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Adrian Diaz (UPC) at adiaz@ac.upc.edu to register; registration is free, but required.\nIn the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz and Larri.\nFurther, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.\nAgenda In the TUC meeting there will be:\nupdates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads. 
talks by data management practitioners highlighting graph data management challenges selected scientific talks on graph data management technology The meeting will start on Friday morning, with a program from 10:30-17:00\n10:30-12:00: TUC session (public)\nPeter Boncz (CWI): GraphQL task force update - the G-CORE proposal (pptx) Gabor Szarnyas (Budapest University of Technology and Economics Hungarian Academy of Sciences): Updates on the Social Network Benchmark BI Workload Alexandru Iosup, Wing Lung Ngai (VU/TU Delft): LDBC Graphalytics v0.9, Graphalytics Global Competition and Graphalytics Custom Benchmark 12:00-13:30: lunch break\n13:30-15:00: TUC session (public)\nArnau Prat (UPC): Datasynth: Democratizing property graph generation Marcus Paradies (SAP): SAP HANA GraphScript Yinglong Xia (Huawei): The EYWA Graph Engine in a Cloud AI Platform Gaétan Hains (Huawei): Cost semantics for graph queries 15:00-15:30: break\n15:30-17:00: TUC session (public)\nPetra Selmer and Stefan Plantikow (Neo4j): openCypher Developments in 2017 Markus Kaindl (Springer): SN SciGraph \u0026ndash; Building a Linked Data Knowledge Graph for the Scholarly Publishing Domain Irini Fundulaki (FORTH): The HOBBIT Link Discovery and Versioning Benchmarks Ghislain Atemezing (Mondeca): Benchmarking Enterprise RDF stores with Publications Office Dataset Speakers should aim for a 20-minute talk.\nFurther:\non Friday evening (19:00-21:00) there will be a social dinner at Löwenbräukeller, sponsored and arranged by LDBC member Huawei (who have their European Research Center in Munich). on Friday morning (8:30-10:30) there will be a meeting of the LDBC board of directors, but this meeting is not public. Venue The Technical University of Munich (TUM) is hosting that week the VLDB conference; on the day of the TUC meeting the main conference will have finished, but there will be a number of co-located workshops ongoing, and the TUC participants will blend in with that crowd for the breaks and lunch.\nThe TUC meeting will be held in in Room 2607 alongside the VLDB workshops that day (MATES, ADMS, DMAH, DBPL and BOSS).\naddress: Technische Universität München (TUM), Arcisstraße 21, 80333 München\nGoogle Maps\n","permalink":"https://ldbcouncil.org/event/tenth-tuc-meeting/","tags":["TUC Meeting"],"title":"Tenth TUC Meeting"},{"categories":null,"contents":"LDBC is pleased to announce its Ninth Technical User Community (TUC) meeting.\nThis will be a two-day event at SAP Headquarters in Walldorf, Germany on February 9+10, 2017.\nThis will be the third TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:\nTwo day event with one day devoted to User\u0026rsquo;s experiences and one day devoted to benchmarking experiences. Presentation of the benchmarking results for the different benchmarks. Interaction with the new LDBC Board of Directors and the LDBC organisation officials. We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at damaris@ac.upc.edu;\nIn the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. 
Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.\nFurther, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.\nAgenda In the TUC meeting there will be\nupdates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Inalytics and Graphalytics workloads. talks by data management practitioners highlighting graph data management challenges selected scientific talks on graph data management technology The meeting will start on Thursday morning, with a program from 09:00-18:00, interrupted by a lunch break.\nThursday evening (19:00-21:00) there will be a social dinner in Heidelberg.\nFriday morning the event resumes from 9:00-12:00. In the afternoon, there is a (closed) LDBC Board of Directors meeting (13:00-16:30) at the same venue.\nSocial Dinner Address: Hauptstraße 217, 69117 Heidelberg\nTime: 19:00 / 7pm\n(See attachments at the bottom of the page)\nThursday start time title – speaker 9:00 Welcome and logistics - Marcus Paradies (SAP) 9:10 Intro + state of the LDBC - Josep Lluis Larriba Pey (UPC) 9:20 LDBC Graph QL task force - Hannes Voigt (TU Dresden) 9:40 PGQL Status Update and Comparison to LDBC\u0026rsquo;s Graph QL proposals - Oskar van Rest (Oracle Labs) 10:00 Adding shortest-paths to MonetDB - Dean de Leo (CWI) 10:20 coffee 10:50 Evolving Cypher for processing multiple graphs - Stefan Plantikow (Neo Technology) 11:10 Standardizing Graph Database Functionality - An Invitation to Collaborate - Jan Michels (ISO/ANSI SQL, Oracle)\u0026quot; 11:30 Dgraph: Graph database for production environment - Tomasz Zdybal (Dgraph.io) 12:00 lunch 13:00 LDBC Graphalytics: Current Capabilities, Upcoming Features, and Long-Term Roadmap - Alexandru Iosup (TU Delft) 13:20 LDBC Graphalytics: Demo of the Live Archive and Competition Features - Tim Hegeman (TU Delft) 13:40 LDBC SNB Datagen Update - Arnau Prat (UPC) 14:00 LDBC SNB Business Intelligence Workload: Chokepoint Analysis - Arnau Prat (UPC) 14:20 LDBC Benchmark Cost Specification (+discussion) - Moritz Kaufmann (TU Munich) 14:40 coffee break 15:10 EYWA: the Distributed Graph Engine in Huawei MIND Platform (Yinglong Xia) 15:30 Graph Processing in SAP HANA - Marcus Paradies (SAP) 15:50 Distributed Graph Analytics with Gradoop - Martin Junghanns (Univ Leipzig) 16:10 Distributed graph flows: Cypher on Flink and Gradoop - Max Kießling (Neo Technology) 16:30 closing - Peter Boncz 17:30 end Friday start time title – speaker 9:00 welcome - Peter Boncz 9:20 Graph processing in obi4wan - Frank Smit (OBI4WAN) 9:40 Graph problems in the space domain - Albrecht Schmidt (ESA) 10:00 Medical Ontologies for Healthcare - Michael Neumann (SAP) 10:20 coffee 10:50 The Train Benchmark: Cross-Technology Performance Evaluation of Continuous Model Queries - Gabor Szarnyas (BME) 11:10 Efficient sparse matrix computations and their generalization to graph computing applications - Albert-Jan Yzelman (Huawei) 11:30 Experiments on Semantic Publishing Benchmark with large scale real news and LOD data at FactForge - Atanas Kyriakov (Ontotext) 
12:00 lunch 13:00 LDBC Board of Directors Meeting 17:00 end Logistics Important things to know The following PDF guide provides additional information, such as recommended restaurants as well as sightseeing spots: link\nVenue The TUC meeting will be held in the SAP Headquarters at the SAP Guesthouse Kalipeh (https://www.kalipeh.com). The address is:\nWDF 44 / SAP Guesthouse Kalipeh\nDietmar-Hopp-Allee 15\n69190 Walldorf\nGermany\nMaps and situation Google Maps link\nGetting there By plane There are two airports close to SAP\u0026rsquo;s headquarter: Frankfurt Airport (FRA) and Stuttgart-Echterdingen Airport (STR). The journey from Frankfurt Airport to SAP headquarters takes about one hour by car, while it takes slightly longer from Stuttgart- Echterdingen Airport. Concerning airfare, flights to Frankfurt are usually somewhat more expensive than to Stuttgart.\nWhen booking flights to Frankfurt, you should be aware of Frankfurt-Hahn Airport (HHN), which serves low-cost carriers but is not connected to Frankfurt Airport. Frankfurt Hahn is approximately one hour from the Frankfurt main airport by car.\nThe journey from Frankfurt Airport to SAP headquarters takes about one hour by car (95 kilometers, or 59 miles).\nJourney time from Stuttgart-Echterdingen Airport to SAP headquarters takes about 1 hour and 15 minutes by car (115 kilometers, or 71 miles).\nDriving directions Traveling from Frankfurt Airport (FRA) to SAP Headquarters:\nDirections to SAP headquarters:\nWhen leaving the airport, follow the highway symbol onto \u0026ldquo;A3/Würzburg/A5/Kassel/Basel/Frankfurt.\u0026rdquo; Follow the A5 to \u0026ldquo;Basel/Karlsruhe/Heidelberg.\u0026rdquo; Take exit 39 \u0026ndash; \u0026ldquo;Walldorf/Wiesloch.\u0026rdquo; Turn left onto B291. Turn right onto Dietmar-Hopp-Allee. (Should you use a navigational system which does not recognize the street name \u0026lsquo;Dietmar-Hopp-Allee\u0026rsquo; please use \u0026lsquo;Neurottstrasse\u0026rsquo; instead.)\nTraveling from Stuttgart-Echterdingen Airport (STR) to SAP Headquarters:\nTo get to SAP headquarters by car, there are two possible routes to take. The first leads you via Heilbronn and the second via Karlsruhe. The route via Karlsruhe is a bit shorter yet may be more congested.\nDirections to SAP headquarters:\nWhen leaving the airport, follow the highway symbol onto \u0026ldquo;A8/Stuttgart/B27.\u0026rdquo; Stay on A8 and follow the sign for \u0026ldquo;Karlsruhe/Heilbronn/Singen/A8.\u0026rdquo; Follow A8 to Karlsruhe. Take exit 41 \u0026ndash; \u0026ldquo;Dreieck Karlsruhe\u0026rdquo; to merge onto A5 toward \u0026ldquo;Frankfurt/Mannheim/Karlsruhe/Landau (Pfalz).\u0026rdquo; Take exit 39 \u0026ndash; \u0026ldquo;Walldorf/Wiesloch.\u0026rdquo; Turn left onto B291. Turn right onto Dietmar-Hopp-Allee. Parking The closest parking lot to the event location is P7 (see figure above).\nBy Train As the infrastructure is very well developed in Europe, and in Germany in particular, taking the train is a great and easy way of traveling. Furthermore, the trains usually run on time, so this mode of travel is very convenient, especially for a group of people on longer journeys to major cities.\nFrom Frankfurt Airport (FRA) to SAP Headquarters\nDirections to SAP headquarters:\nGo to Terminal 1, level T (see overview in Appendix). Go to the AIRail Terminal \u0026ndash; \u0026ldquo;Fernbahnhof\u0026rdquo; (long-distance trains). Choose a connection with the destination train station \u0026ldquo;Wiesloch\u0026ndash;Walldorf\u0026rdquo;. 
From station \u0026ldquo;Wiesloch\u0026ndash;Walldorf,\u0026rdquo; take bus number 707 or 721 toward \u0026ldquo;Industriegebiet Walldorf, SAP.\u0026rdquo; It is a 10-minute ride to reach bus stop \u0026lsquo;SAP headquarters\u0026rsquo;. From Stuttgart-Echterdingen Airport (STR) to SAP Headquarters\nDirections to SAP headquarters:\nGo to the S-Bahn station in the airport, following the sign (station is called \u0026ldquo;Stuttgart Flughafen/Messe\u0026rdquo;). Take train number S2 or S3 to \u0026ldquo;Stuttgart Hauptbahnhof\u0026rdquo; (main station). From Stuttgart Hauptbahnhof choose a connection with the destination train station \u0026ldquo;Wiesloch\u0026ndash;Walldorf\u0026rdquo;. From station \u0026ldquo;Wiesloch\u0026ndash;Walldorf,\u0026rdquo; take bus number 707 or 721 toward \u0026ldquo;Industriegebiet Walldorf, SAP\u0026rdquo;. It is a 10-minute ride to reach bus stop \u0026lsquo;SAP headquarters\u0026rsquo;. ","permalink":"https://ldbcouncil.org/event/ninth-tuc-meeting/","tags":["TUC Meeting"],"title":"Ninth TUC Meeting"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confgrades-leo-b-17/","tags":[],"title":"Extending SQL for Computing Shortest Paths"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confgrades-ngai-hhi-17/","tags":[],"title":"Granula: Toward Fine-grained Performance Analysis of Large-scale Graph Processing Platforms"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confgrades-prat-perez-gskdb-17/","tags":[],"title":"Towards a property graph generator for benchmarking"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-oaep-oaep-2023-03/","tags":[],"title":"Cypher schema constraints proposal"},{"categories":null,"contents":"LDBC is proud to announce the new LDBC Graphalytics Benchmark draft specification.\nLDBC Graphalytics is the first industry-grade graph data management benchmark for graph analysis platforms such as Giraph. It consists of six core algorithms, standard datasets, synthetic dataset generators, and reference outputs, enabling the objective comparison of graph analysis platforms. It has strong industry support from Oracle, Intel, Huawei and IBM, and was tested and optimized on the best industrial and open-source systems.\nTim Hegeman of TU Delft is today presenting the technical paper describing LDBC Graphalytics at the important VLDB (Very Large DataBases) conference in New Delhi, where his talk also marks the release by LDBC of Graphalytics as a benchmark draft. Practitioners are invited to read the PVLDB paper, download the software and try running it.\nLDBC is eager to use any feedback for its future adoption of LDBC Graphalytics.\nLearn more: [LDBC Graphalytics](/ldbc-graphalytics)\nGitHub: https://github.com/tudelft-atlarge/graphalytics\n","permalink":"https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/","tags":["benchmark","tu delft","graphalytics"],"title":"LDBC Is Proud to Announce the New LDBC Graphalytics Benchmark Draft Specification"},{"categories":null,"contents":"The LDBC consortium is pleased to announce its Eighth Technical User Community (TUC) meeting.\nThis will be a two-day event at the Oracle Conference Center in Redwood Shores on Wednesday and Thursday June 22-23, 2016.\nThis will be the second TUC meeting after the finalisation of the LDBC FP7 EC funded project. 
The event will basically set the following aspects:\nTwo day event with one day devoted to User\u0026rsquo;s experiences and one day devoted to benchmarking experiences. Presentation of the benchmarking results for the different benchmarks. Interaction with the new LDBC Board of Directors and the LDBC organisation officials. We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at damaris@ac.upc.edu; in order to notify Oracle security in advance, registration requests need to be in by June 12.\nIn the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.\nFurther, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.\nIn this page, you\u0026rsquo;ll find information about the following items:\nAgenda Logistics Date Venue Getting there Accommodation Agenda On Wednesday, lunch is provided for all attendees at 12 pm. The TUC Meeting will start at 1pm.\nWednesday, 22nd of June 2016 (Room 203) (full morning: LDBC Board of Directors meeting)\n12:00 - 13:00 Lunch (provided) 13:00 - 13:30 Hassan Chafi (Oracle) and Josep L. Larriba-Pey (Sparsity) Registration and welcome. 13:30 - 14:00 Peter Boncz (CWI) LDBC introduction and status update. 14:00 - 15:00 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey) 14:00 Arnau Prat (DAMA-UPC). Social Network Benchmark, Interactive workload. 14:30 Tim Hegeman (TU Delft). Social Network Benchmark, Analytics workload. 15:00 - 15:30 Coffee break 15:30 - 17:00 Applications and use of Graph Technologies (chair Hassan Chafi) 15:30 Martin Zand (University of Rochester Clinical and Translational Science Institute). Graphing Healthcare Networks: Data, Analytics, and Use Cases. 16:00 David Meibusch, Nathan Hawes (Oracle Labs Australia). Frappé: Querying and managing evolving code dependency graphs. 16:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). UniProt: challenges of a public SPARQL endpoint. 17:00 - 18:30 Graph Technologies (chair Peter Boncz) 17:00 Eugene I. Chong (Oracle USA). Balancing Act to improve RDF Query Performance in Oracle Database. 17:30 Lijun Chang (University of New South Wales). Efficient Subgraph Matching by Postponing Cartesian Products. 18:00 Weining Qian (East China Normal University). On Statistical Characteristics of Real-Life Knowledge Graphs. Thursday, 23rd of June 2016 (Room 203) 08:00 - 09:00 Breakfast (provided) 09:00 - 10:00 Details on the progress of LDBC Task Forces 2 (chair Josep L. Larriba-Pey) 09:00 Peter Boncz (CWI). Query Language Task Force status 09:45 Marcus Paradies (SAP). 
Social Network Benchmark, Business Intelligence workload 10:00 - 12:00 Graph Technologies and Benchmarking (chair Oskar van Rest) 10:00 Sergey Edunov (Facebook). Generating realistic trillion-edge graphs 10:30 George Fletcher (TU Eindhoven). An open source framework for schema-driven graph instance and graph query workload generation. 11:00 Yinglong Xia (Huawei Research America): An Efficient Big Graph Analytics Platform. 11:30 Zhe Wu (Oracle USA). Bridging RDF Graph and Property Graph Data Models 12:00 - 13:30 Lunch (provided) 13:30 - 15:30 Graph Technologies (chair Arnau Prat) 13:30 Tobias Lindaaker (Neo Technology). An open standard for graph queries: the Cypher contribution 14:00 Arash Termehchy (Oregon State University). Toward Representation Independent Graph Querying \u0026amp; Analytics 14:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). In the service of the federation 15:00 Nandish Jayaram (Pivotal). Orion: Enabling Suggestions in a Visual Query Builder for Ultra-Heterogeneous Graphs. 15:30 - 16:00 Coffee break 16:00 - 17:15 Applications and use of Graph Technologies (chair Hassan Chafi) 16:00 Jans Aasman (Franz Inc.). Semantic Data Lake for Healthcare 16:15 Kevin Madden (Tom Sawyer Software). Dismantling Criminal Networks with Graph and Spatial Visualization and Analysis 16:45 Juan Sequeda (Capsenta). Using graph representation and semantic technology to virtually integrate and search multiple diverse data sources 17:15 Kevin Wilkinson (Hewlett Packard Labs). LDBC SNB extensions 17:45 - 18:15 Closing discussion Friday, 24th of June 2016 (Room 105) At the same venue: the fourth international workshop on Graph Data Management, Experience and Systems (GRADES16).\n18:30 social dinner for GRADES registrants (place to be announced)\nLogistics Date 22nd and 23rd June 2016\nVenue The TUC meeting will be held in the Oracle Conference Center\nThe address is:\nRoom 203 (Wed-Thu) \u0026amp; Room 105 (Fri)\nOracle Conference Center\n350 Oracle Parkway\nRedwood City, CA 94065, USA\nMaps and situation\nGoogle Maps link\nOracle Campus map:\nGetting there Driving directions [Southbound] - Take Highway 101 South (toward San Jose) to the Ralston Ave./Marine World Parkway exit. Take Marine World Parkway east which will loop you back over the freeway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right. [Northbound] - Take Highway 101 North (toward San Francisco) to the Ralston Ave./Marine World Parkway exit. Take the first exit ramp onto Marine World Parkway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right. Parking The Conference Center has a designated parking lot located directly across from the building. If the lot is filled there is also additional parking in any of the parking garages located near by. No parking permits are needed.\nPublic transport Take the Caltrain to either San Carlos or Hillsdale and take the free Oracle shuttle from there. 
Get off the Oracle shuttle at 100 Oracle Parkway (second stop) and walk 5 minutes to get to the Conference Center.\nCaltrain timetables: http://www.caltrain.com/schedules/weekdaytimetable.html Oracle Shuttle timetables: http://www.caltrain.com/schedules/Shuttles/Oracle_Shuttle.html You can also take the Caltrain to Belmont and walk 23 min, instead of taking the Oracle shuttle.\nAlternatively, SamTrans (San Mateo County\u0026rsquo;s Transit Agency) provides public bus service between the Millbrae BART station and Palo Alto with three stops on Oracle Parkway - one of which is directly in front of the Oracle Conference Center.\n","permalink":"https://ldbcouncil.org/event/eighth-tuc-meeting/","tags":["TUC Meeting"],"title":"Eighth TUC Meeting"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsemweb-kotsev-mpefk-16/","tags":[],"title":"Benchmarking RDF Query Engines: The LDBC Semantic Publishing Benchmark"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalspvldb-iosup-hnhpmccsat-16/","tags":[],"title":"LDBC Graphalytics: A Benchmark for Large-Scale Graph Analysis on Parallel and Distributed Platforms"},{"categories":null,"contents":"Apache Flink [1] is an open source platform for distributed stream and batch data processing. Flink\u0026rsquo;s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.\nFlink offers multiple APIs to process data from various data sources (e.g. HDFS, HBase, Kafka and JDBC). The DataStream and DataSet APIs allow the user to apply general-purpose data operations, like map, reduce, groupBy and join, on streams and static data respectively. In addition, Flink provides libraries for machine learning (Flink ML), graph processing (Gelly) and SQL-like operations (Table). All APIs can be used together in a single Flink program which enables the definition of powerful analytical workflows and the implementation of distributed algorithms.\nThe following snippet shows how a wordcount program can be expressed in Flink using the DataSet API:\nDataSet\u0026lt;String\u0026gt; text = env.fromElements( \u0026#34;He who controls the past controls the future.\u0026#34;, \u0026#34;He who controls the present controls the past.\u0026#34;); DataSet\u0026lt;Tuple2\u0026lt;String, Integer\u0026gt;\u0026gt; wordCounts = text .flatMap(new LineSplitter()) // splits the line and outputs (word,1) tuples.groupBy(0) // group by word .sum(1); // sum the 1\u0026#39;s wordCounts.print(); At the Leipzig University, we use Apache Flink as execution layer for our graph analytics platform Gradoop [2]. The LDBC datagen helps us to evaluate the scalability of our algorithms and operators in a distributed execution environment. To use the generated graph data in Flink, we wrote a tool that transforms the LDBC output files into Flink data sets for further processing [3]. 
Using the class LDBCToFlink, LDBC output files can be read directly from HDFS or from the local file system:\nfinal ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); final LDBCToFlink ldbcToFlink = new LDBCToFlink( \u0026#34;hdfs:///ldbc_snb_datagen/social_network\u0026#34;, // or \u0026#34;/path/to/social_network\u0026#34; env); DataSet\u0026lt;LDBCVertex\u0026gt; vertices = ldbcToFlink.getVertices(); DataSet\u0026lt;LDBCEdge\u0026gt; edges = ldbcToFlink.getEdges(); The tuple classes LDBCVertex and LDBCEdge hold the information generated by the LDBC datagen and are created directly from its output files. During the transformation process, globally unique vertex identifiers are created based on the LDBC identifier and the vertex class. When reading edge files, source and target vertex identifiers are computed in the same way to ensure consistent linking between vertices.\nEach LDBCVertex instance contains:\nan identifier, which is unique among all vertices * a vertex label (e.g. Person, Comment) * a key-value map of properties including also multivalued properties\n(e.g. Person.email) Each LDBCEdge instance contains:\nan identifier, which is unique among all edges an edge label (e.g. knows, likes) a source vertex identifier a target vertex identifier a key-value map of properties The resulting datasets can be used by the DataSet API and all libraries that are built on top of it (i.e. Flink ML, Gelly and Table). In the following example, we load the LDBC graph from HDFS, filter vertices with the label Person and edges with the label knows and use Gelly to compute the connected components of that subgraph. The full source code is available on GitHub [4].\nfinal ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); final LDBCToFlink ldbcToFlink = new LDBCToFlink( \u0026#34;/home/s1ck/Devel/Java/ldbc_snb_datagen/social_network\u0026#34;, env); // filter vertices with label “Person” DataSet\u0026lt;LDBCVertex\u0026gt; ldbcVertices = ldbcToFlink.getVertices() .filter(new VertexLabelFilter(LDBCConstants.VERTEX_CLASS_PERSON)); // filter edges with label “knows” DataSet\u0026lt;LDBCEdge\u0026gt; ldbcEdges = ldbcToFlink.getEdges() .filter(new EdgeLabelFilter(LDBCConstants.EDGE_CLASS_KNOWS)); // create Gelly vertices suitable for connected components DataSet\u0026lt;Vertex\u0026lt;Long, Long\u0026gt;\u0026gt; vertices = ldbcVertices.map(new VertexInitializer()); // create Gelly edges suitable for connected components DataSet\u0026lt;Edge\u0026lt;Long, NullValue\u0026gt;\u0026gt; edges = ldbcEdges.map(new EdgeInitializer()); // create Gelly graph Graph\u0026lt;Long, Long, NullValue\u0026gt; g = Graph.fromDataSet(vertices, edges, env); // run connected components on the subgraph for 10 iterations DataSet\u0026lt;Vertex\u0026lt;Long, Long\u0026gt;\u0026gt; components = g.run(new ConnectedComponents\u0026lt;Long, NullValue\u0026gt;(10)); // print the component id of the first 10 vertices components.first(10).print(); The ldbc-flink-import tool is available on Github [3] and licensed under the GNU GPLv3. If you have any questions regarding the tool please feel free to contact me on GitHub. 
If you find bugs or have any ideas for improvements, please create an issue or a pull request.\nIf you want to learn more about Apache Flink, a good starting point is the main documentation [5] and if you have any question feel free to ask the official mailing lists.\nThere is also a nice set of videos [6] available from the latest Flink Forward conference.\nReferences [1] http://flink.apache.org/\n[2] https://github.com/dbs-leipzig/gradoop\n[3] https://github.com/s1ck/ldbc-flink-import\n[4] https://gist.github.com/s1ck/b33e6a4874c15c35cd16\n[5] https://ci.apache.org/projects/flink/flink-docs-release-0.10/\n[6] https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA\n","permalink":"https://ldbcouncil.org/post/ldbc-and-apache-flink/","tags":["flink","datagen","snb"],"title":"LDBC and Apache Flink"},{"categories":null,"contents":"The LDBC consortium is pleased to announce its Seventh Technical User Community (TUC) meeting.\nThis will be a two-day event at IBM\u0026rsquo;s TJ Watson facility on Monday and Tuesday November 9/10, 2015.\nThis will be the first TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:\nTwo day event with one day devoted to User\u0026rsquo;s experiences and one day devoted to benchmarking experiences. Presentation of the benchmarking results for the different benchmarks. Interaction with the new LDBC Board of Directors and the LDBC organisation officials. We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at damaris@ac.upc.edu; in order to notify IBM security in advance, registration requests need to be in by Nov 1.\nIn the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.\nFurther, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.\nIn this page, you\u0026rsquo;ll find information about the following items:\nAgenda Logistics\n- Date\n- Venue\n- Maps and situation\n- Getting there Agenda Monday, 9th of November 2015\n8:45 - 9:15 Registration and welcome (Yinglong Xia and Josep L. Larriba Pey)\n9:15 - 9:30 LDBC introduction and status update (Josep L. Larriba-Pey)\n9:30 - 10:30 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)\n9:30 Arnau Prat (DAMA-UPC). Social Network Benchmark, Interactive workload\n10:00 Orri Erling (OpenLink Software). Social Network Benchmark, Business Intelligence workload\n10:30-11:00 Coffee break\n11:00 - 12:30 Details on the progress of LDBC Task Forces 2 (chair Yinglong Xia)\n11:00 Alexandru Iosup (TU Delft). Social Network Benchmark, Analytics workload.\n11:30 Claudio Gutierrez (U Chile). 
Query Language Task Force status.\n12:00 Atanas Kiryakov (Ontotext). Semantic Publishing Benchmark status\n12:30 - 14:00 Lunch break\n14:00 - 16:00 Technologies and benchmarking (chair Hassan Chafi)\n14:00 Molham Aref (LogicBlox). Graph Data Management with LogicBlox\n14:30 Peter Kogge (Notre Dame). BFS as in Graph500 on today\u0026rsquo;s architectures\n15:00 Ching-Yung Lin (IBM). Status and Demo of IBM System G\n15:30-16:00 Coffee break\n16:00 - 17:00 Technologies (chair Irini Fundulaki)\n16:00 Kavitha Srinivas (IBM). SQLGraph: An efficient relational based property graph store\n16:30 David Ediger (GeorgiaTech). STINGER\n17:00 Gary King (Franz Inc.). AllegroGraph\u0026rsquo;s SPARQL implementation with Social Network Analytics abilities using Magic Properties\n17:30 Manoj Kumar (IBM). Linear Algebra Formulation for Large Graph Analytics\n18:00 Reihaneh Amini (Wright State University) Linked Data in the GeoLink Usecase\n19:00 Social dinner\nTuesday 10th November 2015\n9:00 - 10:30 Technology, Applications and Benchmarking (chair Alexandru Iosup)\n9:00 Philip Rathle (Neo). On openCypher\n9:20 Morteza Shahriari (University of Florida). Multi-modal Probabilistic Knowledge Base for Remote Sensing Species Identification\n9:50 Peter Kogge (Notre Dame). Challenging problems with Lexis Nexis Risk Solutions\n10:10 Arnau Prat (DAMA-UPC). DATAGEN, status and perspectives for synthetic data generation\n10:30 - 11:00 Coffee break\n11:00 - 12:45 Applications and use of Graph Technologies (chair Atanas Kiryakov)\n11:00 Hassan Chafi (Oracle). Status and characteristics of PGQL\n11:20 David Guedalia (TAGIIO). Multi-tier distributed mobile applications and how they split their workload,\n11:40 Guojing Cong (IBM). Algorithmic technique and architectural support for fast graph analysis\n12:00 Josep Lluis Larriba-Pey. Conclusions for the TUC meeting and future perspectives\n12:30 - 14:00 Lunch break\n14:00 LDBC Board of Directors\nLogistics Date 9th and 10th November 2015\nVenue The TUC meeting will be held in the IBM Thomas J Watson Research Center.\nThe address is:\nIBM Thomas J Watson Research Center\n1101 Kitchawan Rd,\nYorktown Heights, NY 10598, USA\nIf you are using a GPS system, please enter \u0026ldquo;200 Aqueduct Road, Ossining NY, 10562\u0026rdquo; for accurate directions to the lab entrance. You may also want to check the routing online.\nThe meeting will take place in the Auditorium on November 9th, and in Meeting Room 20-043 on November 10th.\nMaps and situation You are highly suggested to rent a car for your convenience, since the public transportation system does not cover this area very well. Besides, there is no hotel within walkable distance to the IBM T.J. Watson Research Center. Feel free to find carpool with other attendees. You may find car rental and hotels through www.orbitz.com, or www.expedia.com Feel free to email yxia@us.ibm.com for any questions.\nGetting there Upper and Eastern New England\nRoute I-84 west to Route I-684, south to Exit 6, west on Route 35 to Route 100, south to Route 134, west 2.5 miles. IBM is on the left.\nNew Haven and Connecticut Shores\nMerritt Parkway or New England Thruway (Route I-95) west to Route I-287, west to Exit 3, north on Sprain Brook Parkway, which merges into Taconic State Parkway, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.\nNew Jersey\nTake New York State Thruway (Route I-87) east across the Tappan Zee Bridge and follow signs to the Saw Mill Parkway north. 
Proceed north on Saw Mill River Parkway to Taconic State Parkway exit, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.\nUpstate New York\nRoute I-84 east across Newburgh-Beacon Bridge to Exit 16-S. Taconic State Parkway south to Route 134 East exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.\nNew York City (Manhattan)\nHenry Hudson Parkway north, which becomes Saw Mill River Parkway, north to Taconic State Parkway exit. North on Taconic State Parkway to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.\nJohn F. Kennedy International Airport\nNorth on Van Wyck Expressway to the Whitestone Expressway and continue north across the Bronx-Whitestone Bridge to the Hutchinson River Parkway north to the Cross County Parkway exit and proceed west to the Bronx River Parkway. North on the Bronx River Parkway to the Sprain Brook Parkway, which merges into the Taconic State Parkway. Continue north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.\nLaGuardia Airport\nEast on the Grand Central Parkway, north on the Whitestone Expressway, and continue north across the Bronx-Whitestone Bridge. Continue with instructions from John F. Kennedy International Airport, above.\nNewark International Airport\nNorth on the New Jersey Turnpike (Route I-95). Stay in local lanes and take Exit 72 for Palisades Interstate Parkway. North on the Palisades Interstate Parkway to the New York State Thruway, Route I-87, and east across the Tappan Zee Bridge. Continue with instructions from New Jersey, above.\nStewart International Airport\nRoute 207 east to Route I-84, east across Newburgh-Beacon Bridge to Taconic State Parkway, south. Continue with instructions from Upstate New York, above.\nWestchester County Airport\nRight on Route 120, north. Turn left where Route 120 merges with Route 133. Continue on Route 120. Cross Route 100 and continue straight on Shingle House Road to Pines Bridge Road. Turn right and proceed several hundred yards. IBM is on the left.\nPublic Transportation\nMetropolitan Transportation Authority (MTA) train stations nearest to the Yorktown Heights location are the Croton-Harmon and White Plains stations. Taxi service is available at both locations.\n","permalink":"https://ldbcouncil.org/event/seventh-tuc-meeting/","tags":["TUC Meeting"],"title":"Seventh TUC Meeting"},{"categories":null,"contents":"The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not explicitly stated but is discovered using instance matching techniques and tools. 
Instance matching is also known as record linkage [1], duplicate detection [2], entity resolution [3] and object identification [4].\nFor instance, a search in Geonames (http://www.geonames.org/) for \u0026ldquo;Athens\u0026rdquo; would return a resource (i.e., URI) accompanied by a map of the area and information about the place; additional information for the city of Athens can be found in other datasets such as DBpedia (http://dbpedia.org/) or Open Government Datasets (http://data.gov.gr/). To obtain all the necessary information about the city of Athens, we need to establish that the retrieved resources refer to the same real world object.\nWeb resources are published by \u0026ldquo;autonomous agents\u0026rdquo; who choose their preferred information representation or the one that best fits the application of interest. Furthermore, different representations of the same real world entity are due to data acquisition errors or different acquisition techniques used to process scientific data. Moreover, real world entities evolve and change over time, and sources need to keep track of these developments, a task that is very hard and often not possible. Finally, when integrating data from multiple sources, the process itself may add new erroneous data. Clearly, these problems are not limited to the era of Web Data; it is thus not surprising that instance matching systems have been around for several years [2][5].\nIt is therefore essential to develop, along with instance and entity matching systems, instance matching benchmarks that determine the weak and strong points of those systems, as well as their overall quality, in order to support users in deciding which system to use for their needs. Hence, well-defined, good-quality benchmarks are important for comparing the performance of available and under-development instance matching systems. Benchmarks are used not only to inform users of the strengths and weaknesses of systems, but also to motivate developers, researchers and technology vendors to deal with the weak points of their systems and to ameliorate their performance and functionality. They are also useful for identifying the settings in which each of the systems has optimal performance. Benchmarking aims at providing an objective basis for such assessments.\nAn instance matching benchmark for Linked Data consists of a source and target dataset implementing a set of test-cases, where each test case addresses a different kind of requirement regarding instance matching, a ground truth or gold standard and finally the evaluation metrics used to assess the benchmark.\nDatasets are the raw material of a benchmark. A benchmark comprises a source and a target dataset, and the objective of an instance matching system is to discover the matches of the two. Datasets are characterized by (a) their nature (real or synthetic), (b) the schemas/ontologies they use, (c) their domains, (d) the languages they are written in, and (e) the variations/heterogeneities of the datasets. Real datasets are widely used in benchmarks since they offer realistic conditions for heterogeneity problems and they have realistic distributions. 
Synthetic datasets are generated using automated data generators and are useful because they offer fully controlled test conditions, have accurate gold standards and allow setting the focus on specific types of heterogeneity problems in a systematic manner\nDatasets (and benchmarks) may contain different kinds of variations that correspond to different test cases. According to Ferrara et.al. [6][7], three kinds of variations exist for Linked Data, namely data variations, structural variations and logical variations. The first refers mainly to differences due to typographical errors, differences in the employed data formats, language etc. The second refers to the differences in the structure of the employed Linked Data schemas. Finally, the third type derives from the use of semantically rich RDF and OWL constructs that enable one to define hierarchies and equivalence of classes and properties, (in)equality of instances, complex class definitions through union and intersection among others.\nThe common case in real benchmarks is that the datasets to be matched contain different kinds (combinations) of variations. On the other hand, synthetic datasets may be purposefully designed to contain specific types (or combinations) of variations (e.g., only structural), or may be more general in an effort to illustrate all the common cases of discrepancies that appear in reality between individual descriptions.\nThe gold standard is considered as the “correct answer sheet” of the benchmark, and is used to judge the completeness and soundness of the result sets of the benchmarked systems. For instance matching benchmarks employing synthetic datasets, the gold standard is always automatically generated, as the errors (variations) that are added into the datasets are known and systematically created. When it comes to real datasets, the gold standard can be either manually curated or (semi-) automatically generated. In the first case, domain experts manually mark the matches between the datasets, whereas in the second, supervised and crowdsourcing techniques aid the process of finding the matches, a process that is often time consuming and error prone.\nLast, an instance matching benchmark uses evaluation metrics to determine and assess the systems’ output quality and performance. For instance matching tools, performance is not a critical aspect. On the other hand, an instance matching tool should return all and only the correct answers. So, what matters most is returning the relevant matches, rather than returning them quickly. For this reason, the evaluation metrics that are dominantly employed for instance matching benchmarks are the standard precision, recall and f-measure metrics.\nReferences [1] Li, C., Jin, L., and Mehrotra, S. (2006) Supporting efficient record linkage for large data sets using mapping techniques. WWW 2006.\n[2] Dragisic, Z., Eckert, K., Euzenat, J., Faria, D., Ferrara, A., Granada, R., Ivanova, V., Jimenez-Ruiz, E., Oskar Kempf, A., Lambrix, P., Montanelli, S., Paulheim, H., Ritze, D., Shvaiko, P., Solimando, A., Trojahn, C., Zamaza, O., and Cuenca Grau, B. (2014) Results of the Ontology Alignment Evaluation Initiative 2014. Proc. 9th ISWC workshop on ontology matching (OM 2014).\n[3] Bhattacharya, I. and Getoor, L. (2006) Entity resolution in graphs. Mining Graph Data. Wiley and Sons 2006.\n[4] Noessner, J., Niepert, M., Meilicke, C., and Stuckenschmidt, H. (2010) Leveraging Terminological Structure for Object Reconciliation. 
In ESWC 2010.\n[5] Flouris, G., Manakanatas, D., Kondylakis, H., Plexousakis, D., Antoniou, G. Ontology Change: Classification and Survey (2008) Knowledge Engineering Review (KER 2008), pages 117-152.\n[6] Ferrara, A., Lorusso, D., Montanelli, S., and Varese, G. (2008) Towards a Benchmark for Instance Matching. Proc. 3th ISWC workshop on ontology matching (OM 2008).\n[7] Ferrara, A., Montanelli, S., Noessner, J., and Stuckenschmidt, H. (2011) Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.\n","permalink":"https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/","tags":["instance matching","spb"],"title":"Elements of Instance Matching Benchmarks: a Short Overview"},{"categories":null,"contents":"In this post we will look at running the LDBC SNB on Virtuoso.\nFirst, let\u0026rsquo;s recap what the benchmark is about:\nfairly frequent short updates, with no update contention worth mentioning\nshort random lookups\nmedium complex queries centered around a person\u0026rsquo;s social environment\nThe updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an online social application does lookups for the most part. The medium complex queries are to challenge the DBMS.\nThe DBMS challenges have to do firstly with query optimization, and secondly with execution with a lot of non-local random access patterns. Query optimization is not a requirement, per se, since imperative implementations are allowed, but we will see that these are no more free of the laws of nature than the declarative ones.\nThe workload is arbitrarily parallel, so intra-query parallelization is not particularly useful, if also not harmful. There are latency constraints on operations which strongly encourage implementations to stay within a predictable time envelope regardless of specific query parameters. The parameters are a combination of person and date range, and sometimes tags or countries. The hardest queries have the potential to access all content created by people within 2 steps of a central person, so possibly thousands of people, times 2000 posts per person, times up to 4 tags per post. We are talking in the millions of key lookups, aiming for sub-second single-threaded execution.\nThe test system is the same as used in the TPC-H series: dual Xeon E5-2630, 2x6 cores x 2 threads, 2.3GHz, 192 GB RAM. The software is the feature/analytics branch of v7fasttrack, available from www.github.com.\nThe dataset is the SNB 300G set, with:\n1,136,127 persons 125,249,604 knows edges 847,886,644 posts, including replies 1,145,893,841 tags of posts or replies 1,140,226,235 likes of posts or replies As an initial step, we run the benchmark as fast as it will go. We use 32 threads on the driver side for 24 hardware threads.\nBelow are the numerical quantities for a 400K operation run after 150K operations worth of warmup.\nDuration: 10:41.251\nThroughput: 623.71 (op/s)\nThe statistics that matter are detailed below, with operations ranked in order of descending client-side wait-time. 
All times are in milliseconds.\n% of total total_wait name count mean min max\n20% 4,231,130 LdbcQuery5 656 6,449.89 245 10,311\n11% 2,272,954 LdbcQuery8 18,354 123.84 14 2,240\n10% 2,200,718 LdbcQuery3 388 5,671.95 468 17,368\n7.3% 1,561,382 LdbcQuery14 1,124 1,389.13 4 5,724\n6.7% 1,441,575 LdbcQuery12 1,252 1,151.42 15 3,273\n6.5% 1,396,932 LdbcQuery10 1,252 1,115.76 13 4,743\n5% 1,064,457 LdbcShortQuery3PersonFriends 46,285 22.9979 0 2,287\n4.9% 1,047,536 LdbcShortQuery2PersonPosts 46,285 22.6323 0 2,156\n4.1% 885,102 LdbcQuery6 1,721 514.295 8 5,227\n3.3% 707,901 LdbcQuery1 2,117 334.389 28 3,467\n2.4% 521,738 LdbcQuery4 1,530 341.005 49 2,774\n2.1% 440,197 LdbcShortQuery4MessageContent 46,302 9.50708 0 2,015\n1.9% 407,450 LdbcUpdate5AddForumMembership 14,338 28.4175 0 2,008\n1.9% 405,243 LdbcShortQuery7MessageReplies 46,302 8.75217 0 2,112\n1.9% 404,002 LdbcShortQuery6MessageForum 46,302 8.72537 0 1,968\n1.8% 387,044 LdbcUpdate3AddCommentLike 12,659 30.5746 0 2,060\n1.7% 361,290 LdbcShortQuery1PersonProfile 46,285 7.80577 0 2,015\n1.6% 334,409 LdbcShortQuery5MessageCreator 46,302 7.22234 0 2,055\n1% 220,740 LdbcQuery2 1,488 148.347 2 2,504\n0.96% 205,910 LdbcQuery7 1,721 119.646 11 2,295\n0.93% 198,971 LdbcUpdate2AddPostLike 5,974 33.3062 0 1,987\n0.88% 189,871 LdbcQuery11 2,294 82.7685 4 2,219\n0.85% 182,964 LdbcQuery13 2,898 63.1346 1 2,201\n0.74% 158,188 LdbcQuery9 78 2,028.05 1,108 4,183\n0.67% 143,457 LdbcUpdate7AddComment 3,986 35.9902 1 1,912\n0.26% 54,947 LdbcUpdate8AddFriendship 571 96.2294 1 988\n0.2% 43,451 LdbcUpdate6AddPost 1,386 31.3499 1 2,060\n0.01% 1,848 LdbcUpdate4AddForum 103 17.9417 1 65\n0.00% 44 LdbcUpdate1AddPerson 2 22 10 34\nAt this point we have in-depth knowledge of the choke points the benchmark stresses, and we can give a first assessment of whether the design meets its objectives for setting an agenda for the coming years of graph database development.\nThe implementation is well optimized in general but still has maybe 30% room for improvement. We note that this is based on a compressed column store. One could think that alternative data representations, like in-memory graphs of structs and pointers between them, are better for the task. This is not necessarily so; at the least, a compressed column store is much more space efficient. Space efficiency is the root of cost efficiency, since as soon as the working set is not in memory, a random access workload is badly hit.\nThe set of choke points (technical challenges) actually revealed by the benchmark is so far as follows:\nCardinality estimation under heavy data skew — Many queries take a tag or a country as a parameter. The cardinalities associated with tags vary from 29M posts for the most common to 1 for the least common. Q6 has a common tag (in top few hundred) half the time and a random, most often very infrequent, one the rest of the time. A declarative implementation must recognize the cardinality implications from the literal and plan accordingly. An imperative one would have to count. Missing this makes Q6 take about 40% of the time instead of 4.1% when adapting.\nCovering indices — Being able to make multi-column indices that duplicate some columns from the table often saves an entire table lookup. For example, an index on post by author can also contain the post\u0026rsquo;s creation date.\nMulti-hop graph traversal — Most queries access a two-hop environment starting at a person. Two queries look for shortest paths of unbounded length. 
For the two-hop case, it makes almost no difference whether this is done as a union or a special graph traversal operator. For shortest paths, this simply must be built into the engine; doing this client-side incurs prohibitive overheads. A bidirectional shortest path operation is a requirement for the benchmark.\nTop K — Most queries returning posts order results by descending date. Once there are at least k results, anything older than the __k__th can be dropped, adding a dateselection as early as possible in the query. This interacts with vectored execution, so that starting with a short vector size more rapidly produces an initial top k.\nLate projection — Many queries access several columns and touch millions of rows but only return a few. The columns that are not used in sorting or selection can be retrieved only for the rows that are actually returned. This is especially useful with a column store, as this removes many large columns (e.g., text of a post) from the working set.\nMaterialization — Q14 accesses an expensive-to-compute edge weight, the number of post-reply pairs between two people. Keeping this precomputed drops Q14 from the top place. Other materialization would be possible, for example Q2 (top 20 posts by friends), but since Q2 is just 1% of the load, there is no need. One could of course argue that this should be 20x more frequent, in which case there could be a point to this.\nConcurrency control — Read-write contention is rare, as updates are randomly spread over the database. However, some pages get read very frequently, e.g., some middle level index pages in the post table. Keeping a count of reading threads requires a mutex, and there is significant contention on this. Since the hot set can be one page, adding more mutexes does not always help. However, hash partitioning the index into many independent trees (as in the case of a cluster) helps for this. There is also contention on a mutex for assigning threads to client requests, as there are large numbers of short operations.\nIn subsequent posts, we will look at specific queries, what they in fact do, and what their theoretical performance limits would be. In this way we will have a precise understanding of which way SNB can steer the graph DB community.\nSNB Interactive Series SNB Interactive, Part 1: What is SNB Interactive Really About? SNB Interactive, Part 2: Modeling Choices SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso ","permalink":"https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/","tags":["snb","interactive"],"title":"SNB Interactive Part 3: Choke Points and Initial Run on Virtuoso"},{"categories":null,"contents":"Next 31st of May the GRADES workshop will take place in Melbourne within the ACM/SIGMOD presentation. GRADES started as an initiative of the Linked Data Benchmark Council in the SIGMOD/PODS 2013 held in New York.\nAmong the papers published in this edition we have \u0026ldquo;Graphalytics: A Big Data Benchmark for Graph-Processing Platforms\u0026rdquo;, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can be found in https://github.com/ldbc) as the base to execute the algorithms used for the benchmark, among which we have BFS, community detection and connected components. We also have \u0026ldquo;Microblogging Queries on Graph Databases: an Introspection\u0026rdquo; which benchmarks two of the most significant Graph Databases in the market, i.e. 
Neo4j and Sparksee using microblogging queries on top of twitter data. We can finally mention \u0026ldquo;Frappé: Querying the Linux Kernel Dependency Graph\u0026rdquo; which presents a framework for querying and visualising the dependencies of large C/C++ software systems.\nCheck the complete agenda.\nMeet you in Melbourne!\n","permalink":"https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/","tags":["sigmod","graphalytics","grades","snb","datagen","workshop"],"title":"SNB and Graphs Related Presentations at GRADES '15"},{"categories":null,"contents":"​SNB Interactive is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.\nIn the case of Virtuoso, we have played with SQL and SPARQL implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that this allows to materialize multi-part indices and data orderings that make sense for the application. In other words, there is transparency into physical design. An RDF application may also have physical design by means ofstructure-aware storage but this is more complex and here we are just concerned with speed and having things work precisely as we intend.\nSchema Design SNB has a regular schema described by a UML diagram. This has a number of relationships of which some have attributes. There are no heterogenous sets, e.g. no need for run-time typed attributes or graph edges with the same label but heterogeneous end points. Translation into SQL or RDF is straightforward. Edges with attributes, e.g. the knows relation between people would end up represented as a subject with the end points and the date since as properties. The relational implementation has a two-part primary key and the date since as a dependent column. A native property graph database would use an edge with an extra property for this, as such are typically supported.\nThe only table-level choice has to do with whether posts and comments are kept in the same or different data structures. The Virtuoso schema has a single table for both, with nullable columns for the properties that occur only in one. This makes the queries more concise. There are cases where only non-reply posts of a given author are accessed. This is supported by having two author foreign key columns each with its own index. There is a single nullable foreign key from the reply to the post/comment being replied to.\nThe workload has some frequent access paths that need to be supported by index. Some queries reward placing extra columns in indices. For example, a common pattern is accessing the most recent posts of an author or group of authors. There, having a composite key of ps_creatorid, ps_creationdate, ps_postid pays off since the top-k on creationdate can be pushed down into the index without needing a reference to the table.\nThe implementation is free to choose data types for attributes, specifically datetimes. The Virtuoso implementation adopts the practice of the Sparksee and Neo4J implementations and represents this is a count of milliseconds since epoch. This is less confusing, faster to compare and more compact than a native datetime datatype that may or may not have timezones etc. Using a built-in datetime seems to be nearly always a bad idea. 
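As a minimal illustration of this representation choice (a hypothetical Python sketch, not code from any of the SNB implementations), timestamps can be normalized to epoch milliseconds once at load time, after which every date comparison is a plain integer comparison:

```python
from datetime import datetime, timezone

def to_epoch_millis(iso_timestamp: str) -> int:
    # Assumes the timestamp is interpreted as UTC; the point is that after this
    # one-time conversion, dates are compact integers with no timezone or
    # calendar logic left in the query path.
    dt = datetime.fromisoformat(iso_timestamp).replace(tzinfo=timezone.utc)
    return int(dt.timestamp() * 1000)

creation_date = to_epoch_millis("2012-05-29T09:33:47")
cutoff = to_epoch_millis("2012-01-01T00:00:00")
is_recent = creation_date >= cutoff  # integer comparison, no datetime semantics involved
```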
A dimension table or a number for a time dimension avoids the ambiguities of a calendar or at least makes these explicit.\nThe benchmark allows procedurally maintaining materializations of intermediate results for use by queries as long as these are maintained transaction by transaction. For example, each person could have the 20 newest posts by immediate contacts precomputed. This would reduce Q2 \u0026ldquo;top of the wall\u0026rdquo; to a single lookup. This dows not however appear to be worthwhile. The Virtuoso implementation does do one such materialization for Q14: A connection weight is calculated for every pair of persons that know each other. This is related to the count of replies by one or the other to content generated by the other. If there does not exist a single reply in either direction, the weight is taken to be 0. This weight is precomputed after bulk load and subsequently maintained each time a reply is added. The table for this is the only row-wise structure in the schema and represents a half matrix of connected people, i.e. person1, person2 -\u0026gt; weight. Person1 is by convention the one with the smaller p_personid. Note that comparing id\u0026rsquo;s in this way is useful but not normally supported by RDF systems. RDF would end up comparing strings of URI\u0026rsquo;s with disastrous performance implications unless an implementation specific trick were used.\nIn the next installment we will analyze an actual run.\nSNB Interactive Series SNB Interactive, Part 1: What is SNB Interactive Really About? SNB Interactive, Part 2: Modeling Choices SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso ","permalink":"https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/","tags":["snb","virtuoso","interactive"],"title":"SNB Interactive Part 2: Modeling Choices"},{"categories":null,"contents":"LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015. The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.\nOn the industry track, LDBC will be presenting the Social Network Benchmark Interactive Workload by Orri Erling (OpenLink Software), Alex Averbuch (Neo Technology), Josep Larriba-Pey (Sparsity Technologies), Hassan Chafi (Oracle Labs), Andrey Gubichev (TU Munich), Arnau Prat (Universitat Politècnica de Catalunya), Minh-Duc Pham (VU University Amsterdam) and Peter Boncz (CWI).\nYou can read more about the Social Network Benchmark here and collaborate if you\u0026rsquo;re interested!\nThe other presentation will be at the GRADES workshop within the SIGMOD program regarding Graphalytics: A Big Data Benchmark for Graph-Processing platforms by Mihai Capotă, Tim Hegeman, Alexandru Iosup (Delft University of Technology), Arnau Prat (Universitat Politècnica de Catalunya), Orri Erling (OpenLink Sotware) and Peter Boncz (CWI). 
We will provide more information about GRADES and this specific presentation in a following post as GRADES is part of the events organized by LDBC.\nDon\u0026rsquo;t forget to check our presentations if you\u0026rsquo;re attending the SIGMOD!\n","permalink":"https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/","tags":["sigmod","grades","snb","graphalytics","workshop"],"title":"LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference"},{"categories":null,"contents":"This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. This is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of same.\nWith two implementations of SNB interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its performance characteristics are understood and even if these do not represent the maximum of the attainable, there are no glaring mistakes and the implementation represents a reasonable best effort by those who ought to know, namely the system vendors.\nThe essence of a benchmark is a set of trick questions or choke points, as LDBC calls them. A number of these were planned from the start. It is then the role of experience to tell whether addressing these is really the key to winning the race. Unforeseen ones will also surface.\nSo far, we see that SNB confronts the implementor with choices in the following areas:\nData model: Relational, RF, property graph? Physical model, e.g. row-wise vs. column wise storage Materialized data ordering: Sorted projections, composite keys, replicating columns in auxxiliary data structures Maintaining precomputed, materialized intermediate results, e.g. use of materialized views, triggers Query optimization: join order/type, interesting physical data orderings, late projection, top k, etc. Parameters vs. literals: Sometimes different parameter values result in different optimal query plans Predictable, uniform latency: The measurement rules stipulate the SUT must not fall behind the simulated workload Durability - how to make data durable while maintaining steady throughput? Logging vs. checkpointing. In the process of making a benchmark implementation, one naturally encounters questions about the validity, reasonability and rationale of the benchmark definition itself. Additionally, even though the benchmark might not directly measure certain aspects of a system, making an implementation will take a system past its usual envelope and highlight some operational aspects.\nData generation - Generating a mid-size dataset takes time, e.g. 8 hours for 300G. In a cloud situation, keeping the dataset in S3 or similar is necessary, re-generating every time is not an option. Query mix - Are the relative frequencies of the operations reasonable? What bias does this introduce? Uniformity of parameters: Due to non-uniform data distributions in the dataset, there is easily a 100x difference between a \u0026lsquo;fast\u0026rsquo; and \u0026lsquo;slow\u0026rsquo; case of a single query template. How long does one need to run to balance these fluctuations? Working set: Experience shows that there is a large difference between almost warm and steady state of working set. This can be a factor of 1.5 in throughput. Are the latency constraints reasonable? 
In the present case, a qualifying run must have under 5% of all query executions starting over 1 second late. Each execution is scheduled beforehand and done at the intended time. If the SUT does not keep up, it will have all available threads busy and must finish some work before accepting new work, so some queries will start late. Is this a good criterion for measuring consistency of response time? There are some obvious possibilities of abuse. Is the benchmark easy to implement/run? Perfection is open-ended and optimization possibilities infinite, albeit with diminishing returns. Still, getting startyed should not be too hard. Since systems will be highly diverse, testing that these in fact do the same thing is important. The SNB validation suite is good for this and given publicly available reference implementations, the effort of getting started is not unreasonable. Since a Qualifying run must meet latency constraints while going as fast as possible, setting the performance target involves trial and error. Does the tooling make this easy? Is the durability rule reasonable? Right now, one is not required to do checkpoints but must report the time to roll forward from the last checkpoint or initial state. Incenting vendors to build faster recovery is certainly good, but we are not through with all the implications. What about redundant clusters? The following posts will look at the above in light of actual experience.\nSNB Interactive Series SNB Interactive, Part 1: What is SNB Interactive Really About? SNB Interactive, Part 2: Modeling Choices SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso ","permalink":"https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/","tags":["snb","virtuoso","interactive"],"title":"SNB Interactive Part 1: What Is SNB Interactive Really About?"},{"categories":null,"contents":"In a previous 3-part blog series we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn\u0026rsquo;t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more traditional database benchmark workloads. Additionally, it will motivate why we chose to develop a new workload driver as part of this work, rather than using existing tooling that was developed in other database benchmarking efforts. To briefly recap, the task of the driver is to run a transactional database benchmark against large synthetic graph datasets - \u0026ldquo;graph\u0026rdquo; is the word that best captures the novelty and difficulty of this work.\nWorkload Execution - Traditional vs Graph\nTransactional graph workloads differ from traditional relational workloads in several fundamental ways, one of them being the complex dependencies that exist between queries of a graph workload.\nTo understand what is meant by \u0026ldquo;traditional relational workloads\u0026rdquo;, take the classical TPC-C benchmark as an example. In TPC-C Remote Terminal Emulators (emulators) are used to issue update transactions in parallel, where the transactions issued by these emulators do not depend on one another. Note, \u0026ldquo;dependency\u0026rdquo; is used here in the context of scheduling, i.e., one query is dependent on another if it can not start until the other completes. 
For example, a New-Order transaction does not depend on other orders from this or other users. Naturally, the results of Stock-Level transactions depend on the items that were previously sold, but in TPC-C it is not an emulator\u0026rsquo;s responsibility to enforce any such ordering. The scheduling strategy employed by TPC-C is tailored to the scenario where transactional updates do not depend on one another. In reality, one would expect to also have scheduling dependencies between transactions, e.g., checking the status of the order should only be done after the order is registered in the system. TPC-C, however, does not do this and instead only asks for the status of the last order for a given user. Furthermore, adding such dependencies to TPC-C would make scheduling only slightly more elaborate. Indeed, the Load Tester (LT) would need to make sure a New-Order transaction always precedes the read requests that check its status, but because users (and their orders) are partitioned across LTs, and orders belong to a particular user, this scheduling does not require inter-LT communication.\nA significantly more difficult scheduling problem arises when we consider the SNB benchmark that models a real-world social network. Its domain includes users that form a social friendship graph and which leave posts/comments/likes on each others walls (forums). The update transactions are generated (exported as a log) by the data generator, with assigned timestamps, e.g. user 123 added post 456 to forum 789 at time T. Suppose we partition this workload by user, such that each driver gets all the updates (friendship requests, posts, comments and likes on other user\u0026rsquo;s posts etc) initiated by a given user. Now, if the benchmark is to resemble a real-world social network, the update operations represent a highly connected (and dependent) network: a user should not create comments before she joins the network, a friendship request can not be sent to a non-existent user, a comment can only be added to a post that already exists, etc. Given a user partitioning scheme, most such dependencies would cross the boundaries between driver threads/processes, because the correct execution of update operations requires that the social network is in a particular state, and that state depends on the progress of other threads/processes.\nSuch scheduling dependencies in the SNB workload essentially replicate the underlying graph-like shape of its dataset. That is, every time a user comments on a friend\u0026rsquo;s wall, for example, there is a dependency between two operations that is captured by an edge of the social graph. Partitioning the workload among the LTs therefore becomes equivalent to graph partitioning, a known hard problem.\nBecause it\u0026rsquo;s a graph\nIn short, unlike previous database benchmarking efforts, the SNB workload has necessitated a redefining of the state-of-the-art in workload execution. It is no longer sufficient to rely solely on workload partitioning to safely capture inter-query dependencies in complex database benchmark workloads. The graph-centric nature of SNB introduces new challenges, and novel mechanisms had to be developed to overcome these challenges. To the best of our knowledge, the LDBC SNB Interactive benchmark is the first benchmark that requires a non-trivial partitioning of the workload, among the benchmark drivers. 
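To make this concrete, below is a deliberately simplified, hypothetical Python sketch of one way a driver could gate dependent operations; it is not the actual LDBC driver code, and names such as CompletionTimeTracker, sim_time and dependency_time are illustrative only. Each executor reports the simulation times of operations it has started and finished, and an operation is only released once everything at or before its dependency time has completed, regardless of which executor ran it.

```python
import threading

class CompletionTimeTracker:
    """Tracks, across all executors, the oldest operation that has been started
    but not yet completed. Everything strictly before that watermark is done."""

    def __init__(self):
        self._lock = threading.Lock()
        self._in_flight = []  # simulation times of started-but-unfinished operations

    def started(self, sim_time):
        with self._lock:
            self._in_flight.append(sim_time)

    def completed(self, sim_time):
        with self._lock:
            self._in_flight.remove(sim_time)

    def watermark(self):
        # All operations with a simulation time below this value have completed.
        with self._lock:
            return min(self._in_flight) if self._in_flight else float("inf")


def run_when_safe(operation, tracker, execute):
    # operation.dependency_time is the simulation time of the latest operation this
    # one depends on, e.g. the creation time of the post a new comment replies to.
    while tracker.watermark() <= operation.dependency_time:
        pass  # a real driver would block or yield here instead of busy-waiting
    tracker.started(operation.sim_time)
    execute(operation)
    tracker.completed(operation.sim_time)
```

The hard part in practice is that this watermark has to be agreed upon across parallel and distributed executors, which is exactly why dependencies that cross partition boundaries are expensive.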
In the context of workload execution, our contribution is therefore the principled design of a driver that executes dependent update operations in a performant and scalable way, across parallel/distributed LTs, while providing repeatable, vendor-independent execution of the benchmark.\n","permalink":"https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/","tags":["snb","driver","interactive"],"title":"Why Do We Need an LDBC SNB-Specific Workload Driver?"},{"categories":null,"contents":"As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain more in depth how this is actually implemented inside of the generator.\nFirst of all, I start with a few basics of how Datagen works internally. In Datagen, once the person graph has been created (persons and their relationships), the activity generation starts. Persons are divided into blocks of 10k, in the same way they are during friendship edges generation process. Then, for each person of the block, three types of forums are created:\nThe wall of the person\nThe albums of the person\nThe groups where the person is a moderator\nWe will put our attention to group generation, but the same concepts apply to the other types of forums. Once a group is created, the members of the group are selected. These are selected from either the friends of the moderator, or random persons within the same block.\nAfter assigning the members to the group, the post generation starts. We have two types of post generators, the uniform post generator and the event based post generator. Each post generator is responsible of, given a forum, generate a set of posts for the forum, whose authors are taken from the set of members of the forum. The uniform post generator distributes the dates of the generated posts uniformly in the time line (from the date of the membership until the end of the simulation time). On the other hand, the event based post generator assigns dates to posts, based on what we call “flashmob events”.\nFlashmob events are generated at the beginning of the execution. Their number is predefined by a configuration parameter which is set to 30 events per month of simulation, and the time of the event is distributed uniformly along all the time line. Also, each event has a volume level assigned (between 1 and 20) following a power law distribution, which determines how relevant or important the event is, and a tag representing the concept or topic of the event. Two different events can have the same tag. For example, one of the flashmob events created for SF1 is one related to \u0026ldquo;Enrique Iglesias\u0026rdquo; tag, whose level is 11 and occurs on 29th of May of 2012 at 09:33:47.\nOnce the event based post generation starts for a given group, a subset of the generated flashmob events is extracted. These events must be correlated with the tag/topic of the group, and the set of selected events is restricted by the creation date of the group (in a group one cannot talk about an event previous to the creation of the group). Given this subset of events and their volume level, a cumulative probability distribution (using the events sorted by event date and their level) is computed, which is later used to determine to which event a given post is associated. Therefore, those events with a larger lavel will have a larger probability to receive posts, making their volume larger. 
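The selection step can be sketched roughly as follows (a hypothetical Python illustration of the idea, not Datagen's actual Java code): the levels of the date-sorted events are accumulated into a cumulative distribution, and each post draws an event from it, so higher-level events attract proportionally more posts.

```python
import bisect
import random

def build_cumulative(events):
    # events: list of (event_date_millis, level) sorted by event date;
    # the level acts as an unnormalized probability mass for the event.
    cumulative, total = [], 0.0
    for _, level in events:
        total += level
        cumulative.append(total)
    return cumulative, total

def pick_event(events, cumulative, total, rng=random):
    # Sample one event with probability proportional to its level.
    r = rng.uniform(0.0, total)
    return events[bisect.bisect_left(cumulative, r)]

# Illustrative events only; the first one mirrors the level-11 event of 2012-05-29 09:33:47.
events = [(1335000000000, 3), (1336500000000, 7), (1338284027000, 11)]
cumulative, total = build_cumulative(events)
event_date, level = pick_event(events, cumulative, total)
```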
Then, post generation starts, which can be summarized as follows:\nDetermine the number of posts to generate\nSelect a random member of the group that will generate the post\nDetermine the event the post will be related to given the aforementioned cumulative distribution\nAssign the date of the post based on the event date\nIn order to assign the date to the post, based on the date of the event the post is assigned to, we follow the following probability density, which has been extracted from [1]. The shape of the probability density consists of a combination of an exponential function in the 8 hour interval around the peak, while the volume outside this interval follows a logarithmic function. The following figure shows the actual shape of the volume, centered at the date of the event.\nFollowing the example of \u0026ldquo;Enrique Iglesias\u0026rdquo;, the following figure shows the activity volume of posts around the event as generated by Datagen.\nIn this blog entry we have seen how datagen creates event driven user activity. This allows us to reproduce the heterogenous post creation density found in a real social network, where post creation is driven by real world events.\nReferences [1] Jure Leskovec, Lars Backstrom, Jon M. Kleinberg: Meme-tracking and the dynamics of the news cycle. KDD 2009: 497-506\n","permalink":"https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/","tags":["datagen","social network","snb"],"title":"Event Driven Post Generation in Datagen"},{"categories":null,"contents":"The LDBC consortium are pleased to announce its Sixth Technical User Community (TUC) meeting.\nThis will be a two-day event at Universitat Politècnica de Catalunya, Barcelona on Thursday and Friday March 19/20, 2015.\nThe LDBC FP7 EC funded project is reaching its finalisation, and this will be the last event sponsored directly by the project. However, tasks within LDBC will continue based on the LDBC independent organisation. The event will basically set the following aspects:\nTwo day event with one day devoted to User\u0026rsquo;s experiences and one day devoted to benchmarking experiences. Presentation of the first benchmarking results for the different benchmarks. Interaction with the new LDBC Board of Directors and the whole new LDBC organisation officials. Pre-event with the 3rd Graph-TA workshop organised on March 18th at the same premises, with a lot of interaction and interesting research presentations. We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact damaris@ac.upc.edu.\nAgenda Thursday 19th March\n11:00 - 11:30 Registration, coffee break and welcome (Josep Larriba Pey)\n11:30 - 12:00 LDBC introduction and status update (Peter Boncz) – slides\n12:00 - 13:30 Technology and benchmarking (chair: Peter Boncz)\n12:00 Venelin Kotsev (Ontotext). Semantic Publishing Benchmark v2.0. – slides\n12:30 Nina Saveta (FORTH). SPIMBENCH: A Scalable, Schema-Aware, Instance Matching Benchmark for the Semantic Publishing Domain\n12:50 Tomer Sagi (HP). 
Titan DB on LDBC SNB Interactive\n13:10 Claudio Martella (VUA): Giraph and Lighthouse\n13:30 - 14:30 Lunch break\n14:30 - 16:00 Applications and use of Graph Technologies (chair: Hassan Chafi)\n14:30 Jerven Bolleman (Swiss Institute of Bioinformatics): 20 billion triples in production slides\n14:50 Mark Wilkinson (Universidad Politécnica de Madrid): Design principles for Linked-Data-native Semantic Web Services slides\n15:10 Peter Haase (Metaphacts, Systap LLC): Querying the Wikidata Knowledge Graph slides\n15:30 Esteban Sota (GNOSS): Human Interaction with Faceted Searching Systems for big or complex graphs\n18:30 - 20:00 Cultural visit Barcelona city center. Meet at Plaça Catalunya.\n20:00 Social dinner at Bastaix Restaurant.\nFriday 20th March\n9:30 - 11:00 Technology and Benchmarking (chair: Josep L. Larriba-Pey)\n9:30 Yinglong Xia (IBM): Towards Temporal Graph Management and Analytics\n9:50 Alexandru Iosup (TU Delft). Graphalytics: A big data benchmark for graph-processing platforms\n10:10 John Snelson (MarkLogic): Introduction to MarkLogic\n10:30 Arnau Prat (UPC-Sparsity Technologies) and Alex Averbuch (Neo): Social Network Benchmark, Interactive Workload\n10:50 Moritz Kaufmann. The auditing experience\n11:15 - 11:45 Coffee break\n11:45 - 12:45 Applications and use of Graph Technologies (chair: Atanas Kiryakov)\n11:45 Boris Motik (Oxford University): Parallel and Incremental Materialisation of RDF/Datalog in RDFox\n12:05 Andreas Both (Unister): E-Commerce and Graph-driven Applications: Experiences and Optimizations while moving to Linked Data\n12:25 Smrati Gupta (CA Technologies). Modaclouds Decision Support System in multicloud environments\n12:45 Peter Boncz. Conclusions for the LDBC project and future perspectives. slides\n13:30 - 14:30 Lunch break\n15:00 LDBC Board of Directors\nLogistics Date 19th and 20th March 2015\nVenue The TUC meeting will be held at \u0026ldquo;Aula Master\u0026rdquo; at A3 building located inside the \u0026ldquo;Campus Nord UPC\u0026rdquo; in Barcelona. The address is:\nAula Master\nEdifici A3, Campus Nord UPC\nC. Jordi Girona, 1-3\n08034 Barcelona, Spain\nMaps and situation To reach the campus, there are several options, including Taxi, Metro and Bus.\nFinding UPC Finding the meeting room Getting there Flying: Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this map of the airport). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.\nRail: The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to\nthe centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.\nBus: The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.\nTaxi: From the airport, you can take one of Barcelona\u0026rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. 
Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €20 and trips to other destinations in the city cost approximately €25-30.\nTrain and bus: Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. You can find detailed information in the following link: http://www.barcelona-airport.com/eng/transport_eng.htm\nThe locations of the airport and the city centre ","permalink":"https://ldbcouncil.org/event/sixth-tuc-meeting/","tags":["TUC Meeting"],"title":"Sixth TUC Meeting"},{"categories":null,"contents":"This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.\nWhen generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other more qualitative characteristics such as the degree distribution, clustering coefficient. Real graphs, and specially social networks, have typically highly skewed degree distributions with a long tail, a moderatelly large clustering coefficient and an appreciable community structure.\nThe first two characteristics are deliberately modeled in DATAGEN. DATAGEN generates persons with a degree distribution that matches that observed in Facebook, and thanks to the attribute correlated edge generation process, we obtain graphs with a moderately large clustering coefficient. But what about the community structure of graphs generated with DATAGEN? The answer can be found in the paper titled “How community-like is the structure of synthetically generated graphs”, which was published in GRADES 2014 [1]. Here we summarize the paper and its contributions and findings.\nExisting synthetic graph generators such as Rmat [1] and Mag [2], are graphs generators designed to produce graphs with long tailed distributions and large clustering coefficient, but completely ignore the fact that real graphs are structured into communities. For this reason, Lancichinetti et al. proposed LFR [3], a graph generator that did not only produced graphs with realistic high level characteristics, but enforced an appreciable community structure. This generator, has become the de facto standard for benchmarking community detection algorithms, as it does not only outputs a graph but also the communities present in that graph, hence it can be used to test the quality of a community detection algorithm.\nHowever, no one studied if the community structure produced by LFR, was in fact realistic compared to real graphs. Even though the community structure in LFR exhibit interesting properties, such as the expected larger internal density than external, or a longtailed distribution of community sizes, they lack the noise and inhomogeneities present in a real graph. And more importantly, how does the community structure of DATAGEN compares to that exhibited in LFR and reap graphs? Is it more or less realistic? The authors of [1] set up an experiment where they analized the characteristics of the communities output by LFR, and the groups (groups of people interested in a given topic) output by DATAGEN, and compared them to a set of real graphs with metadata. 
These real graphs, which can be downloaded from the Snap project website, are graphs that have recently become very popular in the field of community detection, as they contain ground truth communities extracted from their metadata. The ground truth graphs used in this experiment are shown in the following table. For more details about how this ground truth is generated, please refer to [4].\nGraph Nodes Edges\nAmazon 334863 925872\nDblp 317080 1049866\nYoutube 1134890 2987624\nLivejournal 3997962 34681189\nThe authors of [1] selected a set of statistical indicators to characterize the communities:\nThe clustering coefficient\nThe triangle participation ratio (TPR), which is the ratio of nodes that close at least one triangle in the community\nThe bridge ratio, which is the ratio of edges whose removal disconnects the community\nThe diameter\nThe conductance\nThe size\nThe authors start by analyzing each community of the ground truth graphs using the above statistical indicators and plotting the distributions of each of them. The following are the plots of the Livejournal graph. We summarize the findings of the authors regarding real graphs:\nSeveral indicators (clustering coefficient, TPR and bridge ratio) exhibit a multimodal distribution, with two peaks at their extremes. Many of the communities (44%) have a small clustering coefficient between 0 and 0.01. Out of them, 56% have just three vertices. On the other hand, 11% of the communities have a clustering coefficient between 0.99 and 1.0. In between, communities exhibit different values of clustering coefficients. This trend is also observed for TPR and bridge ratio. This suggests that communities cannot be modeled using a single model.\n84% of the communities have a diameter smaller than five, suggesting that ground truth communities are small and compact.\nGround truth communities are not very isolated; they have a lot of connections pointing outside of the community.\nMost of the communities are small (10 or fewer nodes).\nIn general, ground truth communities are small, with a low diameter, not isolated and with different ranges of internal connectivity.\n(Figures: distributions of clustering coefficient, TPR, bridge ratio, diameter, conductance and community size for the ground truth graphs.)\nThe authors performed the same experiment for the DATAGEN and LFR graphs. They generated a graph of 150k nodes, using their default parameters. In the case of LFR, they tested five different values of the mixing factor, which specifies the ratio of edges of a community pointing outside of the community. They ranged this value from 0 to 0.5. The following are the distributions for DATAGEN.\n(Figures: distributions of clustering coefficient, TPR, bridge ratio, diameter, conductance and community size for DATAGEN.)\nThe main conclusions that can be extracted from DATAGEN can be summarized as follows:\nDATAGEN is able to reproduce the multimodal distribution observed for clustering coefficient, TPR and bridge ratio.\nThe central part of the clustering coefficient distribution is biased towards the left, in a similar way as observed for the Youtube and Livejournal graphs.\nCommunities of DATAGEN graphs are, as in real graphs, not isolated, but in this case their level of isolation is significantly larger.\nThe diameter is small, as in the real graphs.\nIt is significant that communities in DATAGEN graphs are closer to those observed in Youtube and Livejournal, as these are social networks like the graphs produced by DATAGEN. We see that DATAGEN is able to reproduce many of their characteristics. Finally, the authors repeat the same experiment for LFR graphs.
The following are the plots for the LFR graph with mixing ratio 0.3. From them, the authors extract the following conclusions:\nLFR graphs do not show the multimodal distribution observed in real graphs.\nOnly the diameter shows a similar shape as in the ground truth.\n(Figures: distributions of clustering coefficient, TPR, bridge ratio, diameter, conductance and community size for LFR.)\nTo better quantify how similar the distributions of the different graphs are, the authors also show the correlograms for each of the statistical indicators. These correlograms contain Spearman\u0026rsquo;s correlation coefficient between each pair of graphs for a given statistical indicator. The bluer the color, the better the correlation. We see that DATAGEN distributions correlate very well with those observed in real graphs, especially, as we commented above, with Youtube and Livejournal. On the other hand, LFR only succeeds significantly in the case of the diameter.\n(Figures: correlograms of clustering coefficient, TPR, bridge ratio, diameter, conductance and community size across the graphs.)\nWe see that DATAGEN is able to reproduce a realistic community structure, compared to existing graph generators. This feature could potentially be exploited to define new benchmarks to measure the quality of novel community detection algorithms. Stay tuned for future blog posts about this topic!\nReferences [1] Arnau Prat-Pérez, David Domínguez-Sal: How community-like is the structure of synthetically generated graphs? GRADES 2014\n[2] Deepayan Chakrabarti, Yiping Zhan, and Christos Faloutsos. R-MAT: A recursive model for graph mining. SIAM 2004\n[3] Myunghwan Kim and Jure Leskovec. Multiplicative attribute graph model of real-world networks. Internet Mathematics\n[4] Andrea Lancichinetti, Santo Fortunato, and Filippo Radicchi. Benchmark graphs for testing community detection algorithms. Physical Review E 2008.\n","permalink":"https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/","tags":["datagen","social network","snb"],"title":"The LDBC Datagen Community Structure"},{"categories":null,"contents":"Publishing and media businesses are going through transformation I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and wrestling my jetlag in front of the Hilton. In the lobby inside, SemTech 2010 conference attendees were watching a game from the FIFA World Cup in South Africa. In the picture, the self-service newspaper stand is empty, except for one free paper. It was not long ago, in the year 2000, that this stand was full. Back then the people in the Bay area were willing to pay for printed newspapers. But this is no longer true.\nWhat’s driving this change in publishing and media?\nWidespread and instantaneous distribution of information over the Internet has turned news into somewhat of a \u0026ldquo;commodity\u0026rdquo; and few people are willing to pay for it;\nThe wealth of free content on YouTube and similar services spoiled the comfort of many mainstream broadcasters;\nOpen access publishing has made it hard for academic publishers to sell journals and books at prices that were considered fair ten years ago.\nAlongside other changes in the industry, publishers figured out that it is critical to add value through better authoring, promotion, discoverability, delivery and presentation of precious content.\nImagine instant news in context, Imagine personal channels, Imagine \u0026hellip; triplestores While plain news can be created repeatedly, premium content and services are not as easy to create.
Think of an article that not only tells the new facts, but refers back to previous events and is complemented by an info-box of relevant facts. It allows one to interpret and comprehend news more effectively. This is the well-known journalistic aim to put news in context. It is also well-known that producing such news in \u0026ldquo;near real time\u0026rdquo; is difficult and expensive using legacy processes and content management technology.\nAnother example would be a news feed that delivers good coverage of information relevant to a narrow subject – for example a company, a story line or a region. Judging by the demand for intelligent press clipping services like Factiva, such channels are in demand but are not straightforward to produce with today’s technology. Despite the common perception that automated recommendations for related content and personalized news are technology no-brainers, suggesting truly relevant content is far from trivial.\nFinally, if we use an example in life sciences, the ability to quickly find scientific articles discussing asthma and x-rays, while searching for respiration disorders and radiation, requires a search service that is not easy to deliver.\nMany publishers have been pressed to advance their business. This, in turn, had led to quest to innovate. And semantic technology can help publishers in two fundamental ways:\nGeneration of rich and \u0026ldquo;meaningful\u0026rdquo; (trying not to use \u0026ldquo;semantic\u0026rdquo; :-) metadata descriptions; 1. Dynamic retrieval of content, based on this rich metadata, enabling better delivery. In this post I write about \u0026ldquo;semantic annotation\u0026rdquo; and how it enables application scenarios like BBC’s Dynamic Semantic Publishing (DSP). I will also present the business case behind DSP. The final part of the post is about triplestores – semantic graph database engines, used in DSP. To be more concrete I write about the Semantic Publishing Benchmark (SPB), which evaluates the performance of triplestores in DSP scenarios.\nSemantic Annotation produces Rich Metadata Descriptions – the fuel for semantic publishing The most popular meaning of \u0026ldquo;semantic annotation\u0026rdquo; is the process of enrichment of text with links to (descriptions of) concepts and entities mentioned in the text. This usually means tagging either the entire document or specific parts of it with identifiers of entities. These identifiers allow one to retrieve descriptions of the entities and relations to other entities – additional structured information that fuels better search and presentation.\nThe concept of using text-mining for automatic semantic annotation of text with respect to very large datasets, such as DBPedia, emerged in early 2000. In practical terms it means using such large datasets as a sort of gigantic gazetteer (name lookup tool) and the ability to disambiguate. Figuring out whether \u0026ldquo;Paris\u0026rdquo; in the text refers to the capital of France or to Paris, Texas, or to Paris Hilton is crucial in such context. 
Sometimes this is massively difficult – try to instruct a computer how to guess whether \u0026ldquo;Hilton\u0026rdquo; in the second sentence of this post refers to a hotel from the chain founded by her grandfather or that I had the chance to meet Paris Hilton in person on the street in San Francisco.\nToday there are plenty of tools (such as the Ontotext Media and Publishing platform and DBPedia Spotlight) and services (such as Thomson Reuter’s OpenCalais and Ontotext’s S4) that offer automatic semantic annotation. Although text-mining cannot deliver 100% correct annotations, there are plenty of scenarios, where technology like this would revoluntionize a business. This is the case with the Dynamic Semantic Publishing scenario described below.\nThe BBC’s Dynamic Semantic Publishing (DSP) Dynamic Semantic Publishing is a model for using semantic technology in media developed by a group led by John O’Donovan and Jem Rayfield at the BBC. The implementation of DSP behind BBC’s FIFA World Cup 2010 website was the first high-profile success story for usage of semantic technology in media. It is also the basis for the SPB benchmark – sufficient reasons to introduce this use case at length below.\nBBC Future Media \u0026amp; Technology department have transformed the BBC relational content management model and static publishing framework to a fully dynamic semantic publishing architecture. With minimal journalistic management, media assets are being enriched with links to concepts, semantically described in a triplestore. This novel semantic approach provides improved navigation, content re-use and re-purposing through automatic aggregation and rendering of links to relevant stories. At the end of the day DSP improves the user experience on BBC’s web site.\n\u0026ldquo;A high-performance dynamic semantic publishing framework facilitates the publication of automated metadata-driven web pages that are light-touch, requiring minimal journalistic management, as they automatically aggregate and render links to relevant stories\u0026rdquo;. \u0026ndash; Jem Rayfield, Senior Technical Architect, BBC News and Knowledge\nThe Dynamic Semantic Publishing (DSP) architecture of the BBC curates and publishes content (e.g. articles or images) based on embedded Linked Data identifiers, ontologies and associated inference. It allows for journalists to determine levels of automation (\u0026ldquo;edited by exception\u0026rdquo;) and support semantic advertisement placement for audiences outside of the UK. The following quote explains the workflow when a new article gets into BBC’s content management system.\n\u0026ldquo;In addition to the manual selective tagging process, journalist-authored content is automatically analysed against the World Cup ontology. A natural language and ontological determiner process automatically extracts World Cup concepts embedded within a textual representation of a story. The concepts are moderated and, again, selectively applied before publication. Moderated, automated concept analysis improves the depth, breadth and quality of metadata publishing.\nJournalist-published metadata is captured and made persistent for querying using the resource description framework (RDF) metadata representation and triple store technology. A RDF triplestore and SPARQL approach was chosen over and above traditional relational database technologies due to the requirements for interpretation of metadata with respect to an ontological domain model. 
The high level goal is that the domain ontology allows for intelligent mapping of journalist assets to concepts and queries. The chosen triplestore provides reasoning following the forward-chaining model and thus implied inferred statements are automatically derived from the explicitly applied journalist metadata concepts. For example, if a journalist selects and applies the single concept \u0026ldquo;Frank Lampard\u0026rdquo;, then the framework infers and applies concepts such as \u0026ldquo;England Squad\u0026rdquo;, \u0026ldquo;Group C\u0026rdquo; and \u0026ldquo;FIFA World Cup 2010\u0026rdquo; \u0026hellip;\u0026rdquo; \u0026ndash; Jem Rayfield\nOne can consider each of the \u0026ldquo;aggregation pages\u0026rdquo; of BBC as a sort of feed or channel serving content related to a specific topic. If you take this perspective, with its World Cup 2010 website BBC was able to provide more than 700 thematic channels.\n\u0026ldquo;The World Cup site is a large site with over 700 aggregation pages (called index pages) designed to lead you on to the thousands of story pages and content\n…we are not publishing pages, but publishing content as assets which are then organized by the metadata dynamically into pages, but could be re-organized into any format we want much more easily than we could before.\n… The index pages are published automatically. This process is what assures us of the highest quality output, but still save large amounts of time in managing the site and makes it possible for us to efficiently run so many pages for the World Cup.\u0026rdquo; \u0026ndash; John O\u0026rsquo;Donovan, Chief Technical Architect, BBC Future Media \u0026amp; Technology\nTo get a real feeling about the load of the triplestore behind BBC\u0026rsquo;s World Cup web site, here are some statistics:\n800+ aggregation pages (Player, Team, Group, etc.), generated through SPARQL queries;\nAverage unique page requests/day: 2 million;\nAverage SPARQL queries/day: 1 million;\n100s repository updates/inserts per minute with OWL 2 RL reasoning;\nMulti data center that is fully resilient, clustered 6 node triplestore.\nThe Semantic Publishing Benchmark LDBC\u0026rsquo;s Semantic Publishing Benchmark (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the BBC Dynamic Semantic Publishing scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volumes of read requests (SPARQL queries collecting recent content and data to generate web pages on a specific subject, e.g. Frank Lampard).\nSPB simulates a setup for media that deals with large volumes of streaming content, e.g. articles, pictures, videos. This content is being enriched with metadata that describes it through links to reference knowledge:\nReference knowledge: taxonomies and databases that include relevant concepts, entities and factual information (e.g. sport statistics);\nMetadata for each individual piece of content allows publishers to efficiently produce live streams of content relevant to specific subjects.\nIn this scenario the triplestore holds both reference knowledge and metadata. The main interactions with the repository are of two types:\nAggregation queries retrieve content according to various criteria. There are two sets (mixes) of aggregation queries. The basic one includes interactive queries that involve retrieval of concrete pieces of content, as well as aggregation functions, geo-spatial and full-text search constraints. 
The analytical query mix includes analytical queries, faceted search and drill-down queries;\nUpdates, adding new metadata or updating the reference knowledge. It is important that such updates should immediately impact the results of the aggregation queries. Imagine a fan checking the page for Frank Lampard right after he scored a goal – she will be very disappointed to see out of date statistics there.\nSPB v.1.0 directly reproduces the DSP setup at the BBC. The reference dataset consists of BBC Ontologies (Core, Sport, News), BBC datasets (list of F1 teams, MPs, etc.) and an excerpt from Geonames for the UK. The benchmark is packed with metadata generator that allows one to set up experiments at different scales. The metadata generator produces 19 statements per Creative Work (BBC’s slang for all sorts of media assets). The standard scale factor is 50 million statements.\nA more technical introduction to SPB can be found in this post. Results from experiments with SPB on different hardware configurations, including AWS instances, are available in this post. An interesting discovery is that given the current state of the technology (particularly the GraphDB v.6.1 engine) and today’s cloud infrastructure, the load of BBC’s World Cup 2010 website can be handled at AWS by a cluster that costs only $81/day.\nDespite the fact that SPB v.1.0 follows closely the usage scenario for triplestores in BBC’s DSP incarnations, it is relevant to a wide range of media and publishing scenarios, where large volumes of \u0026ldquo;fast flowing\u0026rdquo; content need to be \u0026ldquo;dispatched\u0026rdquo; to serve various information needs of a huge number of consumers. The main challenges can be summarized as follows:\nThe Triplestore is used as operational database serving a massive number of read queries (hundreds of queries per second) in parallel with tens of update transactions per second. Transactions need to be handled instantly and in a reliable and consistent manner;\nReasoning is needed to map content descriptions to queries in a flexible manner;\nThere are specific requirements, such as efficient handling of full-text search, geo-spatial and temporal constraints.\nSPB v.2.0 – steeper for the engines, closer to the publishers We are in the final testing of the new version 2.0 of SPB. The benchmark has evolved to allow for retrieval of semantically relevant content in a more advanced manner and at the same time to demonstrate how triplestores can offer simplified and more efficient querying.\nThe major changes in SPB v.2.0 can be summarized as follows:\nMuch bigger reference dataset: from 170 thousand to 22 million statements. Now it includes GeoNames data about all of Europe (around 7 million statements) and DBPedia data about companies, people and events (14 million statements). This way we can simulate media archives described against datasets with good global coverage for specific types of objects. Such large reference sets also provide a better testing ground for experiments with very large content archives – think of 50 million documents (1 billion statements) or more;\nBetter interconnected reference data: more than 5 million links between entities, including 500,000 owl:sameAs links between DBPedia and Geonames descriptions. The latter evaluates the capabilities of the engine to deal with data coming from multiple sources, which use different identifiers for one and the same entity;\nRetrieval of relevant content through links in the reference data, including inferred ones. 
To this end it is important than SPB v.2.0 involves much more comprehensive inference, particularly with respect to transitive closure of parent-company and geographic nesting chains.\n","permalink":"https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/","tags":["industry","spb"],"title":"Industry Relevance of the Semantic Publishing Benchmark"},{"categories":null,"contents":"The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution plans for a given query.\nIn this post, we propose a different approach to query optimization, which is meant to complement (rather than replace) the standard optimization methodologies for SPARQL queries. Our approach is based on the use of schema information, encoded using OWL constructs, which often accompany Linked Data.\nOWL adopts the Open World Assumption and hence OWL axioms are perceived primarily to infer new knowledge. Nevertheless, ontology designers consider OWL as an expressive schema language used to express constraints for validating the datasets, hence following the Closed World Assumption when interpreting OWL ontologies. Such constraints include disjointness/equivalence of classes/properties, cardinality constraints, domain and range restrictions for properties and others.\nThis richness of information carried over by OWL axioms can be the basis for the development of schema-aware techniques that will allow significant improvements in the performance of existing RDF query engines when used in tandem with data statistics or even other heuristics based on patterns found in SPARQL queries. As a simple example, a cardinality constraint at the schema level can provide a hint on the proper join ordering, even if data statistics are missing or incomplete.\nThe aim of this post is to show that the richness of information carried over by OWL axioms under the Close World Assumption can be the basis for the development of schema-aware optimization techniques that will allow considerable improvement for query processing. To attain this objective, we discuss a small set of interesting cases of OWL axioms; a full list can be found here.\nSchema-Based Optimization Techniques Here we provide some examples of queries, which, when combined with specific schema constraints expressed in OWL, can help the optimizer in formulating the (near to) optimal query plans.\nA simple first case is the case of constraint violation. Consider the query below, which returns all instances of class \u0026lt;A\u0026gt; which are fillers of a specific property \u0026lt;P\u0026gt;. If the underlying schema contains the information that the range of \u0026lt;P\u0026gt; is class \u0026lt;B\u0026gt;, and that class \u0026lt;B\u0026gt; is disjoint from class \u0026lt;A\u0026gt;, then this query should return the empty result, with no further evaluation (assuming that the constraints associated with the schema are satisfied by the data). An optimizer that takes into account schema information should return an empty result in constant time instead of trying to optimize or evaluate the large star join.\nSELECT ?v WHERE { ?v rdf : type \u0026lt;A\u0026gt; . 
?u \u0026lt;P\u0026gt; ?v . ?u \u0026lt;P\u0026gt; ?v1 . ?u \u0026lt;P1 \u0026gt; ?v2 . ?u \u0026lt;P2 \u0026gt; ?v3 . ?u \u0026lt;P3 \u0026gt; ?v4 . ?u \u0026lt;P4 \u0026gt; ?v5} Schema-aware optimizers could also prune the search space by eliminating results that are known a priori not to be in the answer set of a query. The query above is an extreme such example (where all potential results are pruned), but other cases are possible, such as the case of the query below, where all subclasses of class \u0026lt;A1\u0026gt; can immediately be identified as not being in the answer set.\nSELECT ?c WHERE { ?x rdf: type ?c . ?x \u0026lt;P\u0026gt; ?y . FILTER NOT EXISTS \\{ ?x rdf: type \u0026lt;A1 \u0026gt; }} Another category of schema-empowered optimizations has to do with improved selectivity estimation. In this respect, knowledge about the cardinality (minimum cardinality, maximum cardinality, exact cardinality, functionality) of a property can be exploited to formulate better query plans, even if data statistics are incomplete, missing or erroneous.\nSimilarly, taking into account class hierarchies, or the definition of classes/properties via set theoretic constructs (union, intersection) at the schema level, can provide valuable information on the selectivity of certain triple patterns, thus facilitating the process of query optimization. Similar effects can be achieved using information about properties (functionality, transitivity, symmetry etc).\nAs an example of these patterns, consider the query below, where class \u0026lt;C\u0026gt; is defined as the intersection of classes \u0026lt;C1\u0026gt;, \u0026lt;C2\u0026gt;. Thus, the triple pattern (?x rdf:type \u0026lt;C\u0026gt;) is more selective than (?y rdf:type \u0026lt;C1\u0026gt;) and (?z rdf:type \u0026lt;C2\u0026gt;) and this should be immediately recognizable by the optimizer, without having to resort to cost estimations. This example shows also how unnecessary triple patterns can be pruned from a query to reduce the number of necessary joins. Figure 1 illustrates the query plan obtained when the OWL intersectionOf construct is used.\nSELECT ?x WHERE { ?x rdf: type \u0026lt;C\u0026gt; . ?x \u0026lt;P1 \u0026gt; ?y . ?y rdf : type \u0026lt;C1 \u0026gt; . ?y \u0026lt;P2 \u0026gt; ?z . ?z rdf : type \u0026lt;C2 \u0026gt; } Schema information can also be used by the query optimizer to rewrite SPARQL queries to equivalent ones that are found in a form for which already known optimization techniques are easily applicable. For example, the query below could easily be transformed into a classical star-join query if we know (from the schema) that property P4 is a symmetric property.\nSELECT ?y ?y1 ?y2 ?y3 WHERE { ?x \u0026lt;P1 \u0026gt; ?y . ?x \u0026lt;P2 \u0026gt; ?y1 . ?x \u0026lt;P3 \u0026gt; ?y2 . ?y3 \u0026lt;P4 \u0026gt; ?x } Conclusion In this post we argued that OWL-empowered optimization techniques can be beneficial for SPARQL query optimization when used in tandem with standard heuristics based on statistics. We provided some examples which showed the power of such optimizations in various cases, namely:\nCases where the search space can be pruned due to the schema and the associated constraints; an extreme special sub-case is the identification of queries that violate schema constraints and thus produce no results. Cases where the schema can help in the estimation of triple pattern selectivity, even if statistics are incomplete or missing. 
Cases where the schema can identify redundant triple patterns that do not affect the result and can be safely eliminated from the query. Cases where the schema can be used for rewriting a query in an equivalent form that would facilitate optimization using well-known optimization techniques. This list is by no means complete, as further cases can be identified by optimizers. Our aim in this post was not to provide a complete listing, but to demonstrate the potential of the idea in various directions.\n","permalink":"https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/","tags":["developer","industry"],"title":"OWL-Empowered SPARQL Query Optimization"},{"categories":null,"contents":"When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically drawn to the friendship subgraph and/or its structure. However, a social graph is more than a bunch of people connected by friendship relations; it has a lot of other elements worth looking at. A quick look at commercial social networks like Facebook, Twitter or Google+ reveals a lot of other elements such as text, images or even video assets. More importantly, all these elements form other subgraphs within the social network! For example, the person activity subgraph is composed of posts and their replies in the different forums/groups in a social network, and has a tree-like structure connecting people through their message interactions.\nWhen looking at the LDBC Social Network Benchmark (SNB) and its interactive workload, one realizes that these other subgraphs, and especially the person activity subgraph, play a role even more important than that played by the friendship subgraph. Just two numbers that illustrate this importance: 11 out of the 14 interactive workload queries need to traverse parts of the person activity subgraph, and about 80% of all the data generated by DATAGEN belongs to this subgraph. As a consequence, a lot of effort has been devoted to making sure that the person activity subgraph is realistic enough to fulfill the needs of the benchmark. In the rest of this post, I will discuss some of the features implemented in DATAGEN that make the person activity subgraph interesting.\nRealistic Message Content Message content in DATAGEN is not random, but contains snippets of text extracted from DBpedia related to the tags the message has. Furthermore, not all messages are the same size, depending on whether they are posts or replies. For example, the size of a post is selected uniformly between a minimum and a maximum, but also, there is a small probability that the content is very large (about 2000 characters). In the case of comments (replies to posts), there is a probability of 0.66 that they are very short (“ok”, “good”, “cool”, “thanks”, etc.). Moreover, in real forum conversations, it is typical to see conversations evolving from one topic to another. For this reason, there is a probability that the tags of comments replying to a post change during the flow of the conversation, moving from the post\u0026rsquo;s tags to other related or randomly selected tags.\nNon-uniform activity levels In a real social network, not all the members show the same level of activity. Some people post messages more sporadically than others, whose activity is significantly higher. DATAGEN reproduces this phenomenon by correlating the activity level with the number of friends the person has. 
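(The sketch below is a toy illustration of the two rules just described - the 0.66 short-reply probability and the degree-correlated posting volume. The constants and method names are invented for the example; this is not DATAGEN\u0026rsquo;s actual code.)\nimport java.util.Random;\nclass ActivitySketch {\n    // replies are very short (ok, thanks, ...) with probability 0.66, longer otherwise\n    static int commentLength(Random rnd) {\n        return rnd.nextDouble() \u0026lt; 0.66 ? 2 + rnd.nextInt(8) : 20 + rnd.nextInt(180);\n    }\n    // posting volume (and group memberships) grows with the friendship degree, plus some noise\n    static int numPosts(Random rnd, int numFriends) {\n        return 1 + numFriends / 2 + rnd.nextInt(3);\n    }\n}\n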
In other words, the larger the number of friends a person has, the larger the number of posts they create and the larger the number of groups they belong to.\nTime-correlated post and comment generation In a real social network, user activity is driven by real-world events such as sports events, elections or natural disasters, to cite just a few. For this reason, we observe spikes of activity around these events, where the number of messages created increases significantly during a short period of time, reaching a maximum and then decreasing. DATAGEN emulates this behavior by generating a set of real-world events about specific tags. Then, when dates of posts and comments are generated, these events are taken into account in such a way that posts and comments are clustered around them. Also, not all events are equally relevant, so some spikes are larger than others. The shape of the activity is modeled following the model described in [1]. Furthermore, in order to represent the more normal and uniform person activity levels, we also generate uniformly distributed messages along the timeline. The following figure shows the user activity volume along the timeline.\nAs we see, the timeline contains spikes of activity, instead of being uniform. Note that the generally increasing activity volume is due to the fact that more people are added to the social network as time advances.\nIn this post we have reviewed several interesting characteristics of the person activity generation process in DATAGEN. Stay tuned for future blog posts about this topic.\nReferences [1] Leskovec, J., Backstrom, L., \u0026amp; Kleinberg, J. (2009, June). Meme-tracking and the dynamics of the news cycle. In Proceedings of the 15th ACM SIGKDD international conference on Knowledge discovery and data mining (pp. 497-506). ACM.\n","permalink":"https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/","tags":["snb","datagen"],"title":"Person Activity Subgraph Features in LDBC DATAGEN"},{"categories":null,"contents":"The SNB Driver part 1 post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we\u0026rsquo;ll drill down deeper into the details of what it means to execute \u0026ldquo;dependent queries\u0026rdquo; during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in detail; they are just there to serve as a point of reference.\nDefinitions Simulation Time (ST): notion of time created by the data generator. All time stamps in the generated data set are in simulation time\nReal Time (RT): wall clock time\nTime Compression Ratio: function that maps simulation time to real time, e.g., an offset in combination with a compression ratio. It is a static value, set in driver configuration. Real Time Ratio is reported along with benchmark results, allowing others to recreate the same benchmark\nOperation: read and/or write\nDependencies: operations in this set introduce dependencies in the workload. 
That is, for every operation in this set there exists at least one other operation (in Dependents) that cannot be executed until this operation has been processed\nDependents: operations in this set are dependent on at least one other operation (in Dependencies) in the workload\nDue Time (DueT): point in simulation time at which the execution of an operation should be initiated.\nDependent Time (DepT): in addition to Due Time, every operation in Dependents also has a Dependent Time, which corresponds to the Due Time of the operation that it depends on. Dependent Time is always before Due Time. For operations with multiple dependencies Dependent Time is the maximum Due Time of all the operations it depends on.\nSafe Time (SafeT): time duration.\nwhen two operations have a necessary order in time (i.e., dependency) there is at least a SafeT interval between them\nSafeT is the minimum duration between the Dependent Time and Due Time of any operation in Dependents\nOperation Stream: sequence of operations ordered by Due Time (dependent operations must be separated by at least SafeT)\nInitiated Operations: operations that have started executing but not yet finished\nLocal Completion Time (per driver): point in simulation time behind which there are no uncompleted operations. Local Completion Time = min(min(Initiated Operations), max(Completed Operations))\nGlobal Completion Time (GCT): minimum completion time of all drivers. Once GCT has advanced to the Dependent Time of some operation that operation is safe to execute, i.e., the operations it depends on have all completed executing. Global Completion Time = min(Local Completion Time)\nExecution Window (Window): a timespan within which all operations can be safely executed\nAll operations satisfying window.startTime \u0026lt;= operation.DueT \u0026lt; window.endTime may be executed\nWithin a window no restrictions on operation ordering or operation execution time are enforced; the driver is free to choose an arbitrary scheduling strategy inside the window\nTo ensure that execution order respects dependencies between operations, window size is bounded by SafeT, such that: 0 \u0026lt; window.duration \u0026lt;= SafeT\nWindow duration is fixed, per operation stream; this is to simplify scheduling and make benchmark runs repeatable\nBefore any operations within a window can start executing it is required that: GCT \u0026gt;= window.startTime - (SafeT - window.duration)\nAll operations within a window must initiate and complete between window start and end times: window.startTime \u0026lt;= operation.initiate \u0026lt; window.endTime and window.startTime \u0026lt;= operation.complete \u0026lt; window.endTime\nDependency Mode: defines dependencies, i.e., constraints on operation execution order\nExecution Mode: defines how the runtime should execute operations of a given type\nTracking Dependencies Now, the fun part: making sure dependent operations are executed in the correct order.\nConsider that every operation in a workload belongs to none, one, or both of the following sets: Dependencies and Dependents. As mentioned, the driver uses operation time stamps (Due Times) to ensure that dependencies are maintained. It keeps track of the latest point in time behind which every operation has completed. That is, every operation (i.e., dependency) with a Due Time lower than or equal to this time is guaranteed to have completed execution. 
It does this by maintaining a monotonically increasing variable called Global Completion Time (GCT).\nLogically, every time the driver (via a database connector) begins execution of an operation from Dependencies that operation is added to Initiated Operations:\nthe set of operations that have started executing but not yet finished. Then, upon completion, the operation is removed from Initiated Operations and added to Completed Operations:\nthe set of operations that have started and finished executing. Using these sets, each driver process maintains its own view of GCT in the following way. Local progress is monitored and managed using a variable called Local Completion Time (LCT):\nthe point in time behind which there are no uncompleted operations. No operation in Initiated Operations has a lower or equal Due Time and no operation in Completed Operations has an equal or higher Due Time. LCT is periodically sent to all other driver processes, which all then (locally) set their view of GCT to the minimum LCT of all driver processes. At this point the driver has two of the three pieces of information (the third is covered shortly) required for knowing when to execute an operation:\nDue Time: point in time at which an operation should be executed, assuming all preconditions (e.g., dependencies) have been fulfilled\nGCT: every operation (from Dependencies) with a Due Time before this point in time has completed execution\nHowever, with only GCT to track dependencies the driver has no way of knowing when it is safe to execute any particular dependent operation. What GCT communicates is that all dependencies up to some point in time have completed, but whether or not the dependencies for any particular operation are within these completed operations is unknown. The driver would have to wait until GCT has passed the Due Time (because Dependent Time is always lower) of an operation before that operation could be safely executed, which would result in the undesirable outcome of every operation missing its Due Time. The required information is which particular operation in Dependencies a given operation in Dependents depends on - more specifically, the Due Time of that operation. This is referred to as Dependent Time:\nin addition to Due Time, every operation in Dependents also has (read: must have) a Dependent Time, which corresponds to the latest Due Time of all the operations it depends on. Once GCT has advanced beyond the Dependent Time of an operation that operation is safe to execute. Using these three mechanisms (Due Time, GCT, and Dependent Time) the driver is able to execute operations, while ensuring their dependencies are satisfied beforehand.\nScalable execution in the Presence of Dependencies The mechanisms introduced in part 1 guarantee that dependency constraints are not violated, but in doing so they unavoidably introduce the overhead of communication/synchronization between driver threads/processes. To minimize the negative effects that synchronization has on scalability an additional Execution Mode was introduced (more about Execution Modes will be discussed shortly): Windowed Execution. Windowed Execution has two design goals:\na) make the generated load less \u0026lsquo;bursty\u0026rsquo;\nb) allow the driver to \u0026lsquo;scale\u0026rsquo;, so when the driver is given more resources (CPUs, servers, etc.) 
it is able to generate more load.\nIn the context of Windowed Execution, operations are executed in groups (Windows), where operations are grouped according to their Due Time. Every Window has a Start Time, a Duration, and an End Time, and Windows contain only those operations that have a Due Time between Window.startTime and Window.endTime. Logically, all operations within a Window are executed at the same time, some time within the Window. No guarantee is made regarding exactly when, or in what order, an operation will execute within its Window.\nThe reasons this approach is correct are as follows:\nOperations belonging to the Dependencies set are never executed in this manner - the Due Times of Dependencies operations are never modified as this would affect how dependencies are tracked\nThe minimum duration between the Dependent Time and Due Time of any operation in Dependents is known (it can be calculated by scanning through the workload once); this duration is referred to as Safe Time (SafeT)\nA window does not start executing until the dependencies of all its operations have been fulfilled. This is ensured by enforcing that window execution does not start until\nGCT \u0026gt;= window.startTime - (SafeT - window.duration) = window.endTime - SafeT; that is, the duration between GCT and the end of the window is no longer than SafeT\nThe advantages of such an execution mode are as follows:\nAs no guarantees are made regarding time or order of operation execution within a Window, GCT no longer needs to be read before the execution of every operation, only before the execution of every window\nThen, as GCT is read less frequently, it follows that it does not need to be communicated between driver processes as frequently. There is no need or benefit in communicating the GCT protocol message more frequently than approximately once per Window.duration; the side effect is reduced network traffic\nFurther, by making no guarantees regarding the order of execution the driver is free to reschedule operations (within Window bounds). The advantage is that operations can be rearranged in such a way as to reduce unwanted bursts of load during execution, which could otherwise occur while synchronizing GCT during demanding workloads. For example, a uniform scheduler may modify operation Due Times to be uniformly distributed across the Window timespan, to \u0026lsquo;smoothen\u0026rsquo; the load within a Window.\nAs with any system, there are trade-offs to this design, particularly regarding Window.duration. The main trade-off is that between \u0026lsquo;workload resolution\u0026rsquo; and scalability. Increasing Window.duration reduces synchronization but also reduces the resolution at which the workload definition is followed. That is, the generated workload becomes less like the workload definition. However, as this is both bounded and configurable, it is not a major concern. This issue is illustrated in Figure 1, where the same stream of events is split into two different workloads based on different Window sizes. The workload with Window size 5 (on the right) has better resolution, especially for the \u0026lsquo;bursty\u0026rsquo; part of the event stream.\nFigure 1. Window scheduling\nThis design also trades a small amount of repeatability for scalability: as there are no timing or ordering guarantees within a window, two executions of the same window are not guaranteed to be equivalent - \u0026lsquo;what happens in the window stays in the window\u0026rsquo;. 
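As an illustration, a uniform in-window scheduler could be sketched roughly as follows (an assumption-laden sketch, not the driver\u0026rsquo;s actual scheduler; the class and field names are made up for the example):\nimport java.util.List;\nclass UniformWindowScheduler {\n    // Spread the due times of the operations in a window evenly across [startTime, endTime),\n    // keeping each operation inside the window it came from.\n    static void reschedule(List\u0026lt;Operation\u0026gt; ops, long startTime, long endTime) {\n        long step = (endTime - startTime) / Math.max(ops.size(), 1);\n        for (int i = 0; i \u0026lt; ops.size(); i++) {\n            ops.get(i).dueTime = startTime + i * step;\n        }\n    }\n}\nclass Operation { long dueTime; }\nBecause the driver is free to apply any such rescheduling (or none at all), two runs of the same window need not interleave operations identically.\n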
Despite sacrificing this repeatability, the results of operations do not change. No dependency-altering operations occur during the execution of a Window, therefore results for all queries should be equivalent between two executions of the same workload; there is no effect on the expected result for any given operation.\n","permalink":"https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/","tags":["snb","driver","interactive"],"title":"SNB Driver - Part 2: Tracking Dependencies Between Queries"},{"categories":null,"contents":"Up until now we have introduced the challenges faced when executing the LDBC SNB benchmark, as well as explained how some of these are overcome. With the foundations laid, we can now explain precisely how operations are executed.\nBased on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these classifications the driver runtime then knows how each operation should be executed. These modes, as well as what they mean to the driver runtime, are described below.\nDependency Modes While executing a workload the driver treats operations differently, depending on their Dependency Mode. In the previous section operations were categorized by whether or not they are in the sets Dependencies and/or Dependents.\nAnother way of communicating the same categorization is by assigning a Dependency Mode to operations - every operation type generated by a workload definition must be assigned to exactly one Dependency Mode. Dependency Modes define dependencies, i.e., constraints on operation execution order. The driver supports a number of different Dependency Modes: None, Read Only, Write Only, Read Write. 
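The per-mode rules listed below essentially reduce to a small amount of bookkeeping around GCT; a minimal sketch of that bookkeeping (assumed names and structures, not the actual driver code) is shown here:\nimport java.util.concurrent.ConcurrentSkipListSet;\nclass CompletionTimeTracker {\n    // due times of operations that have started but not finished (assumes distinct due times)\n    private final ConcurrentSkipListSet\u0026lt;Long\u0026gt; initiated = new ConcurrentSkipListSet\u0026lt;\u0026gt;();\n    private volatile long maxCompleted = Long.MIN_VALUE;\n    private volatile long gct = Long.MIN_VALUE; // min of all LCTs, received from other driver processes\n    void onInitiated(long dueTime) { initiated.add(dueTime); }\n    void onCompleted(long dueTime) {\n        initiated.remove(dueTime);\n        maxCompleted = Math.max(maxCompleted, dueTime);\n    }\n    // LCT = min(min(Initiated Operations), max(Completed Operations))\n    long localCompletionTime() {\n        return initiated.isEmpty() ? maxCompleted : Math.min(initiated.first(), maxCompleted);\n    }\n    // a dependent operation may start only once GCT has reached its Dependent Time\n    boolean safeToExecute(long dependentTime) { return gct \u0026gt;= dependentTime; }\n    void updateGct(long minOfAllLcts) { gct = minOfAllLcts; }\n}\n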
During workload execution, operations of each type are treated as follows:\n• None\nDepended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations to have completed executing)\n– Prior Execution: do nothing – After Execution: do nothing\n• Read Only\nDepended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations to have completed executing)\nDependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)\n– Prior Execution: wait for GCT \u0026gt;= operation.DepT – After Execution: do nothing\n• Write Only\nDepended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)\nDependent On (NO): operation execution does not depend on GCT to have advanced sufficiently (i.e., correct execution of these operations does not depend on any other operations to have completed execution)\n– Prior Execution: add operation to Initiated Operations\n– After Execution: remove operation from Initiated Operations, add operation to Completed Operations\n• Read Write\nDepended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)\nDependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)\n– Prior Execution: add operation to Initiated Operations, wait for GCT \u0026gt;= operation.DepT\n– After Execution: remove operation from Initiated Operations, add operation to Completed Operations\nExecution Modes Execution Modes relate to how operations are scheduled, when they are executed, and what their failure conditions are. Each operation type in a workload definition must be assigned to exactly one Execution Mode. The driver supports a number of different Execution Modes: Asynchronous, Synchronous, Partially Synchronous. It splits a single workload operation stream into multiple streams, zero or more streams per Execution Mode. During workload execution, operations from each of these streams are treated as follows.\n• Asynchronous: operations are executed individually, when their Due Time arrives.\nMotivation: This is the default execution mode; it executes operations as true to the workload definition as possible.\n– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler – Execute When time \u0026gt;= operation.DueT (and GCT \u0026gt;= operation.DepT)\n– Max Concurrent Executions: unbounded\n– Max Execution Time: unbounded\n– Failure: operation execution starts later than: operation.DueT + Tolerated Delay\n• Synchronous: operations are executed individually, sequentially, in a blocking manner.\nMotivation: Some dependencies are difficult to capture efficiently with SafeT and GCT alone. For example, social applications often support conversations via posts and likes, where likes depend on the existence of posts. Furthermore, posts and likes also depend on the existence of the users that make them. 
However, users are created at a lower frequency than posts and likes, and it can be assumed they do not immediately start creating content. As such, a reasonably long SafeT can be used between the creation of a user and the first time that user creates posts or likes. Conversely, posts are often replied to and/or liked soon after their creation, meaning a short SafeT would be necessary to maintain the ordering dependency. Consequently, maintaining the dependencies related to conversations would require a short SafeT, and hence a small window. This results in windows containing fewer operations, leading to less potential for parallelism within windows, less freedom in scheduling, more synchronization, and greater likelihood of bursty behavior - all negative things.\nThe alternative offered by Synchronous Execution is that, when practical, operations of certain types can be partitioned (e.g. posts and likes could be partitioned by the forum in which they appear), and partitions assigned to driver processes. Using the social application example from above, if all posts and likes were partitioned by forum the driver process that executes the operations from any partition could simply execute them sequentially. Then the only dependency to maintain would be on user operations, reducing synchronization dramatically, and parallelism could still be achieved as each partition would be executed independently, in parallel, by a different driver process.\n– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler\n– Execute When time \u0026gt;= operation.DueT and previousOperation.completed == true (and GCT \u0026gt;= operation.DepT)\n– Max Concurrent Executions: 1\n– Max Execution Time: nextOperation.DueT - operation.DueT\n– Failure: operation execution starts later than: operation.DueT + Tolerated Delay, e.g., if previousOperation did not complete in time, forcing the current operation to wait for longer than the tolerated delay\n• Partially Synchronous (Windowed Execution, described in Section 3.4 in more detail), groups of operations from the same time window are executed together\n– Re-scheduling Before Execution: Yes, as long as the following still holds:\nwindow.startTime \u0026lt;= operation.DueT \u0026lt; window.startTime + window.duration\nOperations within a window may be scheduled in any way, as long as they remain in the window from which they originated: their Due Times, and therefore ordering, may be modified\n– Execute When time \u0026gt;= operation.DueT (and GCT \u0026gt;= operation.DepT)\n– Max Concurrent Executions: number of operations within window\n– Max Execution Time: (window.startTime + window.duration) - operation.DueT\n– Failure: operation execution starts later than: window.startTime + window.duration, or operation execution does not finish by: window.startTime + window.duration\nTying it back to LDBC SNB The driver was designed to execute the workload of LDBC SNB. As discussed, the main challenge of running queries in parallel on graph-shaped data stems from dependencies introduced by the graph structure. In other words, workload partitioning becomes as hard as graph partitioning.\nThe LDBC SNB data can in fact be seen as a union of two parts:\nCore Data: relatively small and dense friendship graph (not more than 10% of the data). Updates on this part are very hard to partition among driver threads, since the graph is essentially a single dense strongly connected component.\nUser Activity Data: posts, replies, likes; this is by far the biggest part of the data. 
Updates on this part are easily partitioned as long as the dependencies with the \u0026ldquo;core\u0026rdquo; part are satisfied (i.e., users don\u0026rsquo;t post things before the profiles are created, etc.).\nIn order to avoid friendship graph partitioning, the driver introduces the concept of SafeT, the minimal simulation time that should pass between two dependent events.\nThis property is enforced by the data generator, i.e. the driver does not need to change or delay some operations in order to guarantee dependency safety. Respecting dependencies now means globally communicating the advances of the Global Completion Time, and making sure that dependent operations do not start earlier than SafeT after the operations they depend on.\nOn the other hand, the driver exploits the fact that some of the dependencies in fact do not hinder partitioning: although replies to a post can only be sent after the post is created, these kinds of dependencies are satisfied if we partition the workload by forum. This way, all (update) operations on posts and comments from one forum are assigned to one driver thread. Since there are typically a lot of forums, each driver thread gets multiple ones. Updates from one forum are then run in Synchronous Execution Mode, and parallelism is achieved by running many distinct forums in parallel. By doing so, we can add posts and replies to forums at very high frequency without the need to communicate the GCT across driver instances (i.e. we efficiently create the so-called flash-mob effects in the posting/replying workload).\n","permalink":"https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/","tags":["snb","driver","interactive"],"title":"SNB Driver - Part 3: Workload Execution Putting It All Together"},{"categories":null,"contents":"Until now we have discussed several aspects of the Semantic Publishing Benchmark (SPB) such as the difference in performance between virtual and real server configurations, how to choose an appropriate query mix for a benchmark run and our experience with using SPB in the development process of GraphDB for finding performance issues.\nIn this post we provide a step-by-step guide on how to run SPB using the Sesame RDF data store on a fresh install of Ubuntu Server 14.04.1. The scenario is easy to adapt to other RDF triple stores which support the Sesame Framework used for querying and analyzing RDF data.\nPrerequisites We start with a fresh server installation, but before proceeding with the setup of the Sesame Data Store and the SPB benchmark we need the following pieces of software up and running:\nGit Apache Ant 1.8 or higher OpenJDK 6 or Oracle JDK 6 or higher Apache Tomcat 7 or higher If you already have these components installed on your machine you can directly proceed to the next section: Installing Sesame\nFollowing are sample commands which can be used to install the required software components:\nsudo apt-get install git sudo apt-get install ant sudo apt-get install default-jdk sudo apt-get install tomcat7 Optionally, the Apache Tomcat Server can be downloaded as a zipped file and extracted in a location of choice.\nAfter a successful installation of Apache Tomcat you should be able to get the default splash page “It works” when you open your web browser and enter the following address: http://\u0026lt;your_ip_address\u0026gt;:8080\nInstalling Sesame We will use the current Sesame version, 2.7.14. 
You can download it here or run following command:\nwget \\\\ \u0026#34;http://sourceforge.net/projects/sesame/files/Sesame%202/2.7.14/openrdf-sesame-2.7.14-sdk.tar.gz/download\u0026#34; \\\\ -O openrdf-sesame-2.7.14-sdk.tar.gz Then extract the Sesame tarball:\ntar -xvzf openrdf-sesame-2.7.14-sdk.tar.gz To deploy sesame you have to copy the two war files that are in openrdf-sesame-2.7.14/war to /var/lib/tomcat7/webapps\nFrom openrdf-sesame-2.7.14/war you can do it with command:\ncp openrdf-*.war \u0026lt;tomcat_install\u0026gt;/webapps Sesame applications write and store configuration files in a single directory and the tomcat server needs permissions for it.\nBy default the configuration directory is: /usr/share/tomcat7/.aduna\nCreate the directory:\nsudo mkdir /usr/share/tomcat7/.aduna Then change the ownership:\nsudo chown tomcat7 /usr/share/tomcat7/.aduna And finally you should give the necessary permissions:\nsudo chmod o+rwx /usr/share/tomcat7/.aduna Now when you go to: http://\u0026lt;your_ip_address\u0026gt;:8080/openrdf-workbench/repositories\nYou should get a screen like this:\nSetup SPB You can download the SPB code and find brief documentation on GitHub:\nhttps://github.com/ldbc/ldbc_spb_bm\nA detailed documentation is located here:\nhttps://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf\nSPB offers many configuration options which control various features of the benchmark e.g.:\nquery mixes dataset size loading datasets number of agents validating results test conformance to OWL2-RL ruleset update rate of agents Here we demonstrate how to generate a dataset and execute a simple test\nrun with it.\nFirst download the SPB source code from the repository:\ngit clone https://github.com/ldbc/ldbc_spb_bm.git Then in the ldbc_spb_bm directory build the project:\nant build-basic-querymix If you simply execute the command:\nant you’ll get a list of all available build configurations for the SPB test driver, but for the purpose of this step-by-step guide, configuration shown above is sufficient.\nDepending on generated dataset size a bigger java heap size may be required for the Sesame Store. You can change it by adding following arguments to Tomcat\u0026rsquo;s startup files e.g. in catalina.sh:\nexport JAVA_OPTS=\u0026#34;-d64 -Xmx4G\u0026#34; To run the Benchmark you need to create a repository in the Sesame Data Store, similar to the following screenshot:\nThen we need to point the benchmark test driver to the SPARQL endpoint of that repository. 
This is done in ldbc_spb_bm/dist/test.properties file.\nThe default value of datasetSize in the properties is set to be 10M, but for the purpose of this guide we will decrease it to 1M.\nYou need to change\ndatasetSize=1000000 Also the URLs of the SPARQL endpoint for the repository\nendpointURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1 endpointUpdateURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1/statements First step, before measuring the performance of a triple store, is to load the reference-knowledge data, generate a 1M dataset, load it into the repository and finally generate query substitution parameters.\nThese are the settings to do that, following parameters will \u0026lsquo;instruct\u0026rsquo; the SPB test driver to perform all the actions described above:\n#Benchmark Operational Phases loadOntologies=true loadReferenceDatasets=true generateCreativeWorks=true loadCreativeWorks=true generateQuerySubstitutionParameters=true validateQueryResults=false warmUp=false runBenchmark=false runBenchmarkOnlineReplicationAndBackup=false checkConformance=false To run the benchmark execute the following:\njava -jar semantic_publishing_benchmark-basic-standard.jar test.properties When the initial run has finished, we should have a 1M dataset loaded into the repository and a set of files with query substitution parameters.\nNext we will measure the performance of Sesame Data Store by changing some configuration properties:\n#Benchmark Configuration Parameters warmupPeriodSeconds=60 benchmarkRunPeriodSeconds=300 ... #Benchmark Operational Phases loadOntologies=false loadReferenceDatasets=false generateCreativeWorks=false loadCreativeWorks=false generateQuerySubstitutionParameters=false validateQueryResults=false warmUp=true runBenchmark=true runBenchmarkOnlineReplicationAndBackup=false checkConformance=false After the benchmark test run has finished result files are saved in folder: dist/logs\nThere you will find three types of results: the result summary of the benchmark run (semantic_publishing_benchmark_results.log), brief results and detailed results.\nIn semantic_publishing_benchmark_results.log you will find the results distributed per seconds. They should be similar to the listing bellow:\nBenchmark Results for the 300-th second\nSeconds : 300 (completed query mixes : 0) Editorial: 2 agents 9 inserts (avg : 22484 ms, min : 115 ms, max : 81389 ms) 0 updates (avg : 0 ms, min : 0 ms, max : 0 ms) 0 deletes (avg : 0 ms, min : 0 ms, max : 0 ms) 9 operations (9 CW Inserts (0 errors), 0 CW Updates (1 errors), 0 CW Deletions (2 errors)) 0.0300 average operations per second Aggregation: 8 agents 2 Q1 queries (avg : 319 ms, min : 188 ms, max : 451 ms, 0 errors) 3 Q2 queries (avg : 550 ms, min : 256 ms, max : 937 ms, 0 errors) 1 Q3 queries (avg : 58380 ms, min : 58380 ms, max : 58380 ms, 0 errors) 2 Q4 queries (avg : 65250 ms, min : 40024 ms, max : 90476 ms, 0 errors) 1 Q5 queries (avg : 84220 ms, min : 84220 ms, max : 84220 ms, 0 errors) 2 Q6 queries (avg : 34620 ms, min : 24499 ms, max : 44741 ms, 0 errors) 3 Q7 queries (avg : 5892 ms, min : 4410 ms, max : 8528 ms, 0 errors) 2 Q8 queries (avg : 3537 ms, min : 546 ms, max : 6528 ms, 0 errors) 4 Q9 queries (avg : 148573 ms, min : 139078 ms, max : 169559 ms, 0 errors) This step-by-step guide gave an introduction on how to setup and run the SPB on a Sesame Data Store. 
Further details can be found in the reference documentation listed above.\nIf you have any troubles running the benchmark, don\u0026rsquo;t hesitate to comment or use our social media channels.\nIn a future post we will go through some of the parameters of SPB and check their performance implications.\n","permalink":"https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/","tags":["spb","sesame","rdf","tutorial","guide"],"title":"Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confwww-pham-peb-15/","tags":[],"title":"Deriving an Emergent Relational Schema from RDF Data"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalsws-loizou-ag-15/","tags":[],"title":"On the formulation of performant SPARQL queries"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-erling-alcgppb-15/","tags":[],"title":"The LDBC Social Network Benchmark: Interactive Workload"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-guisado-gamez-p-14/","tags":[],"title":"Understanding Graph Structure of Wikipedia for Query Expansion"},{"categories":null,"contents":"The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.\nThe SPIMBench test cases provide a systematic way for testing the performance of instance matching systems in different settings. SPIMBench supports the types of test cases already adopted by existing instance matching benchmarks:\nvalue-based test cases based on applying value transformations (e.g., blank character addition and deletion, change of date format, abbreviations, synonyms) on triples relating to given input entity structure-based test cases characterized by a structural transformation (e.g., different nesting levels for properties, property splitting, aggregation) The novelty of SPIMBench lies in the support for the following semantics-aware test cases defined on the basis of OWL constructs:\ninstance (in)equality (owl:sameAs, owl:differentFrom) class and property equivalence (owl:equivalentClass, owl:equivalentProperty) class and property disjointness (owl:disjointWith, owl:AllDisjointClasses, owl:propertyDisjointWith, owl:AllDisjointProperties) class and property hierarchies (rdfs:subClassOf, rdfs:subPropertyOf) property constraints (owl:FunctionalProperty, owl:InverseFunctionalProperty) complex class definitions (owl:unionOf, owl:intersectionOf) SPIMBench uses and extends the ontologies of LDBC\u0026rsquo;s Semantic Publishing Benchmark (SPB) to tackle the more complex schema constructs expressed in terms of OWL. It also extends SPB\u0026rsquo;s data generator to first generate a synthetic source dataset that does not contain any matches, and then to generate matches and non-matches to entities of the source dataset to address the supported transformations and OWL constructs. 
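As a purely illustrative (and hypothetical) example - the specific values below are invented and are not taken from the actual SPIMBench resources - a value-based test case could pair a source instance describing a creative work whose title is, say, Football World Cup Final with a generated target instance that copies it but abbreviates the title and rewrites the modification date in a different format; the gold standard would then record this pair as a match, together with the type of test case, the transformed property and a weight reflecting how much information the transformation removed.\n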
The data generation process allows the creation of arbitrary large datasets, thus supporting the evaluation of both the scalability and the matching quality of an instance matching system.\nValue and structure-based test cases are implemented using the SWING framework [1] on data and object type properties respectively. These are produced by applying the appropriate transformation(s) on a source instance to obtain a target instance. Semantics-based test cases are produced in the same way as with the value and structure-based test cases with the difference that appropriate triples are constructed and added in the target dataset to consider the respective OWL constructs.\nSPIMBench, in addition to the semantics-based test cases that differentiate it from existing instance matching benchmarks, also offers a weighted gold standard used to judge the quality of answers of instance matching systems. It contains generated matches (a pair consisting of an entity of the source dataset and an entity of the target dataset) the type of test case it represents, the property on which a transformation was applied (in the case of value-based and structure-based test cases), and a weight that quantifies how easy it is to detect this match automatically. SPIMBench adopts an information-theoretical approach by applying multi-relational learning to compute the weight of the pair of matched instances by measuring the information loss that results from applying transformations to the source data to generate the target data. This detailed information, which is not provided by state of the art benchmarks, allows users of SPIMBench (e.g., developers of IM systems) to more easily identify the reasons underlying the performance results obtained using SPIMBench and thereby supports the debugging of instance matching systems.\nSPIMBench can be downloaded from our repository and a more thorough description thereof can be found on http://www.ics.forth.gr/isl/spimbench/.\nReferences [1] A. Ferrara, S. Montanelli, J. Noessner, and H. Stuckenschmidt. Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.\n","permalink":"https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/","tags":["instance matching","benchmark"],"title":"Semantic Publishing Instance Matching Benchmark"},{"categories":null,"contents":"We are presently working on the SNB BI workload. Andrey Gubichev of TU Munchen and myself are going through the queries and are playing with two SQL based implementations, one on Virtuoso and the other on Hyper.\nAs discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.\nThere are obvious marketing applications for a SNB-like dataset. There are also security related applications, ranging from fraud detection to intelligence analysis. The latter category is significant but harder to approach, as much of the detail of best practice is itself not in the open. In this post, I will outline some ideas discussed over time that might cristallize into a security related section in the SNB BI workload. We invite comments from practitioners for making the business questions more relevant while protecting sensitive details.\nLet’s look at what scenarios would fit with the dataset. We have people, different kinds of connections between people, organizations, places and messages. Messages (posts/replies), people and organizations are geo-tagged. 
A finer level of geo-tagging, with actual GPS coordinates, travel itineraries etc., all referring to real places, would make the data even more interesting. The geo dimension will be explored separately in a forthcoming post.\nOne of the first things to appear when approaching the question is that the analysis of behavior patterns over time is not easily captured in purely declarative queries. For example, the temporal sequence of events and the quantity and quality of interactions between players lead to intractably long queries which are hard to understand and debug. Therefore, views and intermediate materializations become increasingly necessary.\nAnother feature of the scene is that information is never complete. Even if logs are complete for any particular system, there are always possible interactions outside of the system. Therefore we tend to get match scores more than strictly Boolean conditions. Since everybody is related to everybody else via a relatively short path, the nature and strength of the relationship is key to interpreting its significance.\nSince a query consisting of scores and outer joins only is difficult to interpret and optimize, and since the information is seldom complete, some blanks may have to be filled in by guesses. The database must therefore contain metadata about this.\nAn orthogonal aspect to security applications is the access control of the database itself. One might assume that if a data warehouse of analyzable information is put together, the analyst would have access to the entirety of it. This is however not necessarily the case since the information itself and its provenance may fall under different compartments.\nSo, let’s see how some of these aspects could be captured in the SNB context.\nGeography - We materialize a table of travel events, so that an unbroken sequence of posts from the same location (e.g. country) other than the residence of the poster forms a travel event. The posts may have a fine-grained position (IP, GPS coordinates of photos) that marks an itinerary. This is already beyond basic SQL, needing a procedure or window functions.\nThe communication between people is implicit in reply threads and forum memberships. A reply is the closest that one comes to a person-to-person message in the dataset. Otherwise all content is posted to forums with more or fewer participants. Membership in a high-traffic forum with few participants would indicate a strong connection. Calculating these time-varying connection strengths is a lot of work and a lot of text in queries. Keeping things simple requires materializing a sparse “adjacency cube,” i.e. a relation of person1, person2, time bucket -\u0026gt; connection strength. In the SNB case the connection strength may be derived from reciprocal replies, likes, being in the same forums, knowing each other etc. Selectivity is important, i.e. being in many small forums together counts for more than being in ones where everybody else also participates.\nThe behavior of people in SNB is not identical from person to person, but for the same person it follows a preset pattern. Suppose a question like “which person with access to secrets has a marked change of online behavior?” The change would be starting or stopping communication with a given set of people, for example. Think that the spy meets the future spymaster at a public occasion, has a series of exchanges, travels to an atypical destination, then stops all open contact with the spymaster or related individuals. 
Patterns like this do not occur in the data but can be introduced easily enough.\nIn John Le Carre’s A Perfect Spy the main character is caught because it comes to light that his travel routes nearly always corresponded to his controller’s. This would make a query. This could be cast in marketing terms as a “(un)common shopping basket.”\nAnalytics becomes prediction when one part of a pattern exists without the expected next stage. Thus the same query template can serve for detecting full or partial instances of a pattern, depending on how the scores are interpreted.\nFrom a database angle, these questions group on an item with internal structure. For the shopping basket this is a set. For the travel routes this is an ordered sequence of space/time points, with a match tolerance on the spatial and temporal elements. Another characteristic is that there is a baseline of expectations and the actual behavior. Both have structure, e.g. the occupation/location/interest/age of one’s social circle. These need to be condensed into a sort of metric space and then changes and rates of change can be observed. Again, this calls for a multidimensional cube to be created as a summary, then algorithms to be applied to this. The declarative BI query a la TPC-H does not easily capture all of this.\nThis leads us to graph analytics in a broader sense. Some of the questions addressed here will still fit in the materialized summaries+declarative queries pattern but the more complex summarization and clustering moves towards iterative algorithms.\nThere is at present a strong interest in developing graph analytics benchmarks in LDBC. This is an activity that extends beyond the FP7 project duration and beyond the initial partners. To this effect I have implemented some SQL extensions for BSP-style processing, as hinted at on my blog. These will be covered in more detail in January, when there are actual experiments.\n","permalink":"https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/","tags":["snb","bi"],"title":"Further Developments in SNB BI Workload"},{"categories":null,"contents":"LDBC\u0026rsquo;s Semantic Publishing Benchmark (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the famous BBC Dynamic Semantic Publishing scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with an even higher volume of read requests (SPARQL queries collecting recent content and data to generate a web page on a specific subject, e.g. Frank Lampard). As we wrote earlier, SPB was already successfully used to help developers identify performance issues and to introduce optimizations in SPARQL engines such as GraphDB and Virtuoso. Now we are at the point of experimenting with different sizes of the benchmark and different hardware configurations.\nLately we tested different Amazon Web Services (AWS) instance types for running the SPB basic interactive query mix in parallel with the standard editorial updates – precisely the type of workload that GraphDB experiences in the backend of the BBC Sport website. We discovered and report below a number of practical guidelines about the optimal instance types and configurations. We have proven that SPB 50M workloads can be executed efficiently on a mid-sized AWS instance – a c3.2xlarge machine executes 16 read queries and 15 update operations per second. For $1 paid to Amazon for such an instance GraphDB executes 140 000 queries and 120 000 updates. 
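(These per-dollar figures are simply the measured throughput times 3600 seconds, divided by the hourly instance price; e.g., using the exact c3.2xlarge numbers from Table 1 below: 16.46 queries/sec. x 3600 / $0.42 per hour is roughly 141 000 queries per dollar, and 14.56 updates/sec. x 3600 / $0.42 is roughly 125 000 updates per dollar.)\n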
The most interesting discovery in this experiment is that if BBC were hosting the triplestore behind their Dynamic Semantic Publishing architecture at AWS, the total cost of the server infrastructure behind their Worldcup 2010 website would have been about $80/day.\nThe Experiment For our tests we use:\nGraphDB Standard v6.1 LDBC-SPB test driver (version 0.1.dc9a626 from 10.Nov.2014) configured as follows: 8 aggregation agents (read threads) and 2 editorial agents (write threads); for some configurations we experimented with different numbers of agents also 50M dataset (SF1) 40 minutes of benchmark run time (60 seconds of warm up) 5 different Amazon EC2 instances and one local server Each test run is cold, i.e. data is newly loaded for each run. We set a 5 GByte cache configuration, which is sufficient for the size of the generated dataset. We use the same query substitution parameters (the same randomization seed) for every run, so that we are sure that all test runs are identical.\nWe use two types of instances – M3 and C3 instances. They both provide SSD storage for fast I/O performance. The M3 instances are with E5-2670v2, 2.50GHz CPU and provide good all-round performance, while the C3 instances are compute optimized with stronger CPU – E5-2680v2, 2.80GHz, but have half as much memory as the M3.\nWe also use a local physical server with dual-CPU – E5-2650v2, 2.60Ghz; 256GB of RAM and RAID-0 array of SSD in order to provide ground for interpretation of the performance for the virtualized AWS instances. The CPU capacity of the AWS instances is measured in vCPUs (virtual CPU). A vCPU is a logical core – one hyper-thread of one physical core of the corresponding Intel Xeon processor used by Amazon. This means that a vCPU represents roughly half a physical core, even though the performance of a hyper-threaded core is not directly comparable with two non-hyper-threaded cores. We should keep this in mind comparing AWS instances to physical machines, i.e. our local server with two CPUs with 8 physical cores each has 32 logical cores, which is more than c3.4xlarge instance with 16 vCPUs.\nThe Results For the tests we measured:\nqueries/s for the read threads, where queries include SELECT and CONSTRUCT updates/s for the write threads, where an update operation is INSERT or DELETE queries/$ and updates/$ – respectively queries or updates per dollar is calculated for each AWS instance type based on price and update throughput update/vCPU – modification operations per vCPU per second Results (Table 1.) provide strong evidence that performance depends mostly on processor power. This applies to both queries and updates - which in the current AWS setup go on par with one another. Comparing M3 and C3 instances with equal vCPUs we can see that performance is only slightly higher for the M3 machines and even lower for selects with 8 vCPUs. Taking into account the lower price of C3 because of their lower memory, it is clear that C3 machines are better suited for this type of workload and the sweet spot between price and performance is c3.2xlarge machine.\nThe improvement in performance between the c3.xlarge and c3.2xlarge is more than twofold where the improvement between c3.2xlarge and c3.4xlarge is considerably lower. We also observe slower growth between c3.4xlarge and the local server machine. This is an indication that for SPB at this scale the difference between 7.5GB and 15GB of RAM is substantial, but RAM above this amount cannot be utilized efficiently by GraphDB.\nTable 1. 
SPB Measurement Results on AWS and Local Servers\nServer Type vCPUs R/W Agents RAM (GB) \u0026ldquo;Storage (GB, SSD)\u0026rdquo; Price USD/h Queries/ sec. Updates/ sec. Queries/ USD Updates/ USD Updates/ vCPU m3.xlarge 4 8/2 15 2x 40 0.28 8.39 8.23 107 882 105 873 2.06 m3.2xlarge 8 8/2 30 2x 80 0.56 15.44 15.67 99 282 100 752 1.96 c3.xlarge 4 8/2 7.5 2x 40 0.21 7.17 6.78 122 890 116 292 1.7 c3.2xlarge 8 8/2 15 2x 80 0.42 16.46 14.56 141 107 124 839 1.82 c3.4xlarge 16 8/2 30 2x 160 0.84 23.23 21.17 99 578 90 736 1.32 c3.4xlarge 16 8/3 30 2x 160 0.84 22.89 20.39 98 100 87 386 1.27 c3.4xlarge 16 10/2 30 2x 160 0.84 26.6 19.11 114 000 81 900 1.19 c3.4xlarge 16 10/3 30 2x 160 0.84 26.19 19.18 112 243 82 200 1.2 c3.4xlarge 16 14/2 30 2x 160 0.84 30.84 16.88 132 171 72 343 1.06 c3.4xlarge 16 14/3 30 2x 160 0.84 29.67 17.8 127 157 76 286 1.11 Local 32 8/2 256 8x 256 0.85 37.11 32.04 156 712 135 302 1 Local 32 8/3 256 8x 256 0.85 37.31 32.07 157 557 135 429 1 Local 32 10/2 256 8x 256 0.85 40 31.01 168 916 130 952 0.97 Local 32 14/2 256 8x 256 0.85 36.39 26.42 153 672 111 569 0.83 Local 32 14/3 256 8x 256 0.85 36.22 26.39 152 954 111 443 0.82 Local 32 20/2 256 8x 256 0.85 34.59 23.86 146 070 100 759 0.75 The Optimal Number of Test Agents Experimenting with different number of aggregation (read) and editorial (write) agents at c3.4xlarge and the local server, we made some interesting observations:\nThere is almost no benefit to use more than 2 write agents. This can be explained by the fact that certain aspects of handling writes in GraphDB are serialized, i.e. they cannot be executed in parallel across multiple write threads; Using more read agents can have negative impact on update performance. This is proven by the c3.4xlarge results with 8/2 and with 14/2 agents - while in the later case GraphDB handles a bit higher amount of queries (31 vs. 23) we see a drop in the updates rates (from 21 to 17); Overall, the configuration with 8 read agents and 2 write agents delivers good balanced results across various hardware configurations; For machines with more than 16 cores, a configuration like 10/2 or 14/2, would maximize the number of selects, still with good update rates. This way one can get 30 queries/sec. on c3.4xlarge and 40 queries/sec. on a local server; Launching more than 14 read agents does not help even on local server with 32 logical cores. This indicates that at this point we are reaching some constraints such as memory bandwidth or IO throughput and degree of parallelization. There is some overhead when handling bigger number of agents as the results for the local server tests with 14/3 and 20/2 show the worst results for both queries and updates. Efficiency and Cost AWS instance type c3.2xlarge provides the best price/performance ratio for applications where 15 updates/sec. are sufficient even at peak times. More intensive applications should use type c3.4xlarge, which guarantees more than 20 updates/sec.\nCloud infrastructure providers like Amazon, allow one to have a very clear account of the full cost for the server infrastructure, including hardware, hosting, electricity, network, etc.\n$1 spent on c3.2xlarge ($0.41/hour) allows for handling 140 000 queries, along with more than 120 000 update operations!\nThe full cost of the server infrastructure is harder to compute in the case of purchasing a server and hosting it in a proprietary data center. 
Still, one can estimate the upper limits - for machine, like the local server used in this benchmark, this price is way lower than $1/hour. One should consider that this machine is with 256GB of RAM, which is an overkill for Semantic Publishing Benchmark ran at 50M scale. Under all these assumptions we see that using local server is cheaper than the most cost-efficient AWS instance. This is expected - owning a car is always cheaper than renting it for 3 years in a row. Actually, the fact that the difference of the prices/query in this case are low indicates that using AWS services comes at very low extra cost.\nTo put these figures in the context of a known real world application, let us model the case of a GraphDB Enterprise replication cluster with 2 master nodes and 6 worker nodes - the size of cluster that BBC used for their FIFA Worldcup 2010 project. Given c3.2xlarge instance type, the math works as follows:\n100 queries/sec. handled by the cluster. This means about 360 000 queries per hour or more than 4 million queries per day. This is at least 2 times more than the actual loads of GraphDB at BBC during the peak times of big sports events. 10 updates/sec. - the speed of updates in GraphDB Enterprise cluster is lower than the speed of each worker node in separation. There are relatively few content management applications that need more than 36 000 updates per hour. $81/day is the full cost for the server infrastructure. This indicates an annual operational cost for cluster of this type in the range of $30 000, even without any effort to release some of the worker nodes in non-peak times. ","permalink":"https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/","tags":["spb","amazon","ec2","aws","rdf"],"title":"Sizing AWS Instances for the Semantic Publishing Benchmark"},{"categories":null,"contents":"In previous posts (Getting started with snb, DATAGEN: data generation for the Social Network Benchmark), Arnau Prat discussed the main features and characteristics of DATAGEN: realism, scalability, determinism, usability. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity in a social network site during a period of time. In this post, we conduct a series of experiments that will shed some light on how realistic data produced by DATAGEN looks. For our testing, we generated a dataset of scale factor 10 (i.e., social network of 73K users during 3 years) and loaded it into Virtuoso by following the instructions for generating a SNB dataset and for loading the dataset into Virtuoso. In the following sections, we analyze several aspects of the generated dataset.\nA Realistic social graph One of the most complexly structured graphs that can be found in the data produced by DATAGEN is the friends graph, formed by people and their relationships. We used the R script after Figure 1 to draw the social degree distribution in the SNB friends graph. As shown in Figure 1, the cumulative social degree distribution of the friends graph is similar to that from Facebook (See the note about Facebook Anatomy). 
This is not by chance, as DATAGEN has been designed to deliberately reproduce the Facebook\u0026rsquo;s graph distribution.\nFigure 1: Cumulative distribution #friends per user\n#R script for generating the social degree distribution #Input files: person_knows_person_*.csv library(data.table) library(igraph) library(plotrix) require(bit64) dflist \u0026lt;- lapply(commandArgs(trailingOnly = TRUE), fread, sep=\u0026#34;|\u0026#34;, header=T, select=1:2, colClasses=\u0026#34;integer64\u0026#34;) df \u0026lt;- rbindlist(dflist) setNames(df, c(\u0026#34;P1\u0026#34;, \u0026#34;P2\u0026#34;)) d2 \u0026lt;- df[,length(P2),by=P1] pdf(\u0026#34;socialdegreedist.pdf\u0026#34;) plot(ecdf(d2$V1),main=\u0026#34;Cummulative distribution #friends per user\u0026#34;, xlab=\u0026#34;Number of friends\u0026#34;, ylab=\u0026#34;Percentage number of users\u0026#34;, log=\u0026#34;x\u0026#34;, xlim=c(0.8, max(d2$V1) + 20)) dev.off() Data Correlations Data in real life as well as in a real social network is correlated; e.g. names of people living in Germany have a different distribution than those living in Netherlands, people who went to the same university in the same period have a much higher probability to be friends and so on and so forth. In this experiment we will analyze if data produced by DATAGEN also reproduces these phenomena.\nWhich are the most popular names of a country?\nWe run the following query on the database built in Virtuoso, which computes the distribution of the names of the people for a given country. In this query, \u0026lsquo;A_country_name\u0026rsquo; is the name of a particular country such as \u0026lsquo;Germany\u0026rsquo;, \u0026lsquo;Netherlands\u0026rsquo;, or \u0026lsquo;Vietnam\u0026rsquo;.\nSELECT p_lastname, count (p_lastname) as namecnt FROM person, country WHERE p_placeid = ctry_city and ctry_name = \u0026#39;A_country_name\u0026#39; GROUP BY p_lastname order by namecnt desc; As we can see from Figures 2, 3, and 4, the distributions of names in Germany, Netherlands and Vietnam are different. A name that is popular in Germany such as Muller is not popular in the Netherlands, and it even does not appear in the names of people in Vietnam. We note that the names\u0026rsquo; distribution may not be exactly the same as the contemporary names\u0026rsquo; distribution in these countries, since the names resource files used in DATAGEN are extracted from Dbpedia, which may contain names from different periods of time.\nFigure 2. Distribution of names in Germany\nFigure 3. Distribution of names in Netherlands\nFigure 4. Distribution of names in Vietnam\nWhere my friends are living?\nWe run the following query, which computes the locations of the friends of people living in China.\nSELECT top 10 fctry.ctry_name, count (*) from person self, person friend, country pctry, knows, country fctry WHERE pctry.ctry_name = \u0026#39;China\u0026#39; and self.p_placeid = pctry.ctry_city and k_person1id = self.p_personid and friend.p_personid = k_person2id and fctry.ctry_city = friend.p_placeid GROUP BY fctry.ctry_name ORDER BY 2 desc; As shown in the graph, most of the friends of people living in China are also living in China. The rest comes predominantly from near-by countries such as India, Vietnam.\nFigure 5. 
Locations of friends of people in China\nWhere my friends are studying?\nFinally, we run the following query to find where the friends of people studying at a specific university (e.g., “Hangzhou_International_School”) are studying at.\nSELECT top 10 o2.o_name, count(o2.o_name) from knows, person_university p1, person_university p2, organisation o1, organisation o2 WHERE p1.pu_organisationid = o1.o_organisationid and o1.o_name=\u0026#39;Hangzhou_International_School\u0026#39; and k_person1id = p1.pu_personid and p2.pu_personid = k_person2id and p2.pu_organisationid = o2.o_organisationid GROUP BY o2.o_name ORDER BY 2 desc; As we see from Figure 6, most of the friends of the Hangzhou International School students also study at that university. This is a realistic correlation, as people studying at the same university have a much higher probability to be friends. Furthermore, top-10 universities for the friends of the Hangzhou School students’ are from China, while people from foreign universities have small number of friends that study in Hangzhou School (See Table 1).\nFigure 6. Top-10 universities where the friends of Hangzhou International School students are studying at.\nName # of friends Hangzhou_International_School 12696 Anhui_University_of_Science_and_Technology 4071 China_Jiliang_University 3519 \u0026hellip; Darmstadt_University_of_Applied_Sciences 1 Calcutta_School_of_Tropical_Medicine 1 Chettinad_Vidyashram 1 Women\u0026rsquo;s_College_Shillong 1 Universitas_Nasional 1 Table 1. Universities where friends of Hangzhou International School students are studying at.\nIn a real social network, data is riddled with many more correlations; it is a true data mining task to extract these. Even though DATAGEN may not be able to model all the real life data correlations, it can generate a dataset that reproduce many of those important characteristics found in a real social network, and additionally introduce a series of plausible correlations in it. More and more interesting data correlations may also be found from playing with the SNB generated data.\n","permalink":"https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/","tags":["developer","industry"],"title":"DATAGEN: a Realistic Social Network Data Generator"},{"categories":null,"contents":"In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as driver). Software and documentation for this driver is available here: https://github.com/ldbc/ldbc_driver/. Multiple reference implementations by two vendors are available here: https://github.com/ldbc/ldbc_snb_implementations, and discussion of the schema, data properties, and related content is available here: https://github.com/ldbc/ldbc_snb_docs.\nThe following will concentrate on key decisions and techniques that were developed to support scalable, repeatable, distributed workload execution.\nProblem Description The driver generates a stream of operations (e.g. create user, create post, create comment, retrieve person\u0026rsquo;s posts etc.) and then executes them using the provided database connector. To be capable of generating heavier loads, it executes the operations from this stream in parallel. 
If there were no dependencies between operations (e.g., reads that depend on the completion of writes) this would be trivial. This is the case, for example, for the classical TPC-C benchmark, where splitting the transaction stream into parallel clients (terminals) is trivial. However, for the LDBC SNB Interactive Workload this is not the case: some operations within the stream do depend on others, others are depended on, some both depend on others and are depended on, and some neither depend on others nor are they depended on.\nConsider, for example, a Social Network Benchmark scenario, where the data generator outputs a sequence of events such as User A posted a picture, User B left a comment on the picture of User A, etc. The second event depends on the first one in the sense that there is a causal ordering between them: User B can only leave a comment on the picture once it has been posted. The generated events are already ordered by their time stamp, so in the case of single-threaded execution this ordering is observed by default: the driver issues a request to the SUT with the first event (i.e., User A posts a picture), and after its completion it issues the second event (create a comment). However, if events are executed in parallel, these two events may end up in different parallel sequences of events. Therefore, a driver needs a mechanism to ensure the dependency is observed even when the dependent events are in different parallel update streams.\nThe next blog entries in this series will discuss the approaches used in the driver to deal with these challenges.\n","permalink":"https://ldbcouncil.org/post/snb-driver-part-1/","tags":["snb","driver","tpc-c","interactive"],"title":"SNB Driver - Part 1"},{"categories":null,"contents":"LDBC SPB (Semantic Publishing Benchmark) is based on the BBC linked data platform use case. Thus the data modelling and transaction mix reflect the BBC\u0026rsquo;s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an Ontotext Graph DB deployment. Graph DB was formerly known as Owlim.\nSo, in SPB we wanted to address substantially more complex queries than the lookups that the BBC linked data platform primarily serves. Diverse dataset summaries, timelines and faceted search qualified by keywords and/or geography are examples of online user experience that SPB needs to cover.\nSPB is not per se an analytical workload but we still find that the queries fall broadly into two categories:\nSome queries are centred on a particular search or entity. The data touched by the query does not grow at the same rate as the dataset.\nSome queries cover whole cross sections of the dataset, e.g. find the most popular tags across the whole database.\nThese different classes of questions need to be separated in a metric, otherwise the short lookup dominates at small scales and the large query at large scales.\nAnother guiding factor of SPB was the BBC\u0026rsquo;s and others\u0026rsquo; express wish to cover operational aspects such as online backups, replication and fail-over in a benchmark. True, most online installations have to deal with these things, which are as yet as good as absent from present benchmark practice. We will look at these aspects in a different article; for now, I will just discuss the matter of workload mix and metric.\nNormally the lookup and analytics workloads are divided into different benchmarks. Here we will try something different. 
There are three things the benchmark does:\nUpdates - These sometimes insert a graph, sometimes delete and re-insert the same graph, sometimes just delete a graph. These are logarithmic to data size.\nShort queries - These are lookups that most often touch on recent data and can drive page impressions. These are roughly logarithmic to data scale.\nAnalytics - These cover a large fraction of the dataset and are roughly linear to data size.\nA test sponsor can decide on the query mix within certain bounds. A qualifying run must sustain a minimum, scale-dependent update throughput and must execute a scale-dependent number of analytical query mixes or run for a scale-dependent duration. The minimum update rate, the minimum number of analytics mixes and the minimum duration all grow logarithmically to data size. Within these limits, the test sponsor can decide how to mix the workloads. Publishing several results, emphasizing different aspects, is also possible. A given system may be especially good at one aspect, leading the test sponsor to accentuate this.\nThe benchmark has been developed and tested at small scales, between 50 and 150M triples. Next we need to see how it actually scales. There we expect to see how the two query sets behave differently. One effect that we see right away when loading data is that creating the full text index on the literals is in fact the longest running part. For an SF 32 (1.6 billion triples) SPB database we have the following space consumption figures:\n46886 MB of RDF literal text\n23924 MB of full text index for RDF literals\n23598 MB of URI strings\n21981 MB of quads, stored column-wise with default index scheme\nClearly, applying column-wise compression to the strings is the best move for increasing scalability. The literals are individually short, so literal-per-literal compression will do little or nothing, but applying it per column is known to get a 2x size reduction with Google Snappy. The full text index does not get much from column store techniques, as it already consists of words followed by space-efficient lists of word positions. The above numbers are measured with the Virtuoso column store, with quads column-wise and the rest row-wise. Each number includes the table(s) and any extra indices associated with them.\nLet\u0026rsquo;s now look at a full run at unit scale, i.e. 50M triples.\nThe run rules stipulate a minimum of 7 updates per second. The updates are comparatively fast, so we set the update rate to 70 updates per second. This is seen not to take too much CPU. We run 2 threads of updates, 20 of short queries and 2 of long queries. The minimum run time for the unit scale is 10 minutes, so we do 10 analytical mixes, as this is expected to take a little over 10 minutes. 
The run stops by itself when the last of the analytical mixes finishes.\nThe interactive driver reports:\nSeconds run : 2144 Editorial: 2 agents 68164 inserts (avg : 46 ms, min : 5 ms, max : 3002 ms) 8440 updates (avg : 72 ms, min : 15 ms, max : 2471 ms) 8539 deletes (avg : 37 ms, min : 4 ms, max : 2531 ms) 85143 operations (68164 CW Inserts (98 errors), 8440 CW Updates (0 errors), 8539 CW Deletions (0 errors)) 39.7122 average operations per second Aggregation: 20 agents 4120 Q1 queries (avg : 789 ms, min : 197 ms, max : 6767 ms, 0 errors) 4121 Q2 queries (avg : 85 ms, min : 26 ms, max : 3058 ms, 0 errors) 4124 Q3 queries (avg : 67 ms, min : 5 ms, max : 3031 ms, 0 errors) 4118 Q5 queries (avg : 354 ms, min : 3 ms, max : 8172 ms, 0 errors) 4117 Q8 queries (avg : 975 ms, min : 25 ms, max : 7368 ms, 0 errors) 4119 Q11 queries (avg : 221 ms, min : 75 ms, max : 3129 ms, 0 errors) 4122 Q12 queries (avg : 131 ms, min : 45 ms, max : 1130 ms, 0 errors) 4115 Q17 queries (avg : 5321 ms, min : 35 ms, max : 13144 ms, 0 errors) 4119 Q18 queries (avg : 987 ms, min : 138 ms, max : 6738 ms, 0 errors) 4121 Q24 queries (avg : 917 ms, min : 33 ms, max : 3653 ms, 0 errors) 4122 Q25 queries (avg : 451 ms, min : 70 ms, max : 3695 ms, 0 errors) 22.5239 average queries per second. Pool 0, queries [ Q1 Q2 Q3 Q5 Q8 Q11 Q12 Q17 Q18 Q24 Q25 ] 45318 total retrieval queries (0 timed-out) 22.5239 average queries per second The analytical driver reports:\nAggregation: 2 agents 14 Q4 queries (avg : 9984 ms, min : 4832 ms, max : 17957 ms, 0 errors) 12 Q6 queries (avg : 4173 ms, min : 46 ms, max : 7843 ms, 0 errors) 13 Q7 queries (avg : 1855 ms, min : 1295 ms, max : 2415 ms, 0 errors) 13 Q9 queries (avg : 561 ms, min : 446 ms, max : 662 ms, 0 errors) 14 Q10 queries (avg : 2641 ms, min : 1652 ms, max : 4238 ms, 0 errors) 12 Q13 queries (avg : 595 ms, min : 373 ms, max : 1167 ms, 0 errors) 12 Q14 queries (avg : 65362 ms, min : 6127 ms, max : 136346 ms, 2 errors) 13 Q15 queries (avg : 45737 ms, min : 12698 ms, max : 59935 ms, 0 errors) 13 Q16 queries (avg : 30939 ms, min : 10224 ms, max : 38161 ms, 0 errors) 13 Q19 queries (avg : 310 ms, min : 26 ms, max : 1733 ms, 0 errors) 12 Q20 queries (avg : 13821 ms, min : 11092 ms, max : 15435 ms, 0 errors) 13 Q21 queries (avg : 36611 ms, min : 14164 ms, max : 70954 ms, 0 errors) 13 Q22 queries (avg : 42048 ms, min : 7106 ms, max : 74296 ms, 0 errors) 13 Q23 queries (avg : 48474 ms, min : 18574 ms, max : 93656 ms, 0 errors) 0.0862 average queries per second. Pool 0, queries [ Q4 Q6 Q7 Q9 Q10 Q13 Q14 Q15 Q16 Q19 Q20 Q21 Q22 Q23 ] 180 total retrieval queries (2 timed-out) 0.0862 average queries per second The metric would be 22.52 qi/s, 310 qa/h, 39.7 u/s @ 50Mt (SF 1)\nThe SUT is dual Xeon E5-2630, all in memory. The platform utilization is steadily above 2000% CPU (over 20/24 hardware threads busy on the DBMS). The DBMS is Virtuoso open source, (v7fasttrack at github.com, feature/analytics).\nThe minimum update rate of 7/s was sustained but fell short of the target of 70./s. In this run, most demand was put on the interactive queries. Different thread allocations would give different ratios of the metric components. The analytics mix is for example about 3x faster without other concurrent activity.\nIs this good or bad? I would say that this is possible but better can certainly be accomplished.\nThe initial observation is that Q17 is the worst of the interactive lot. 3x better is easily accomplished by avoiding a basic stupidity. 
The query does the evil deed of checking for a substring in a URI. This is done in the wrong place and accounts for most of the time. The query is meant to test geo retrieval but ends up doing something quite different. Optimizing this right would almost double the interactive score. There are some timeouts in the analytical run, which as such disqualifies the run. This is not a fully compliant result but is close enough to give an idea of the dynamics. So we see that the experiment is definitely feasible, is reasonably defined and that the dynamics seen make sense.\nAs an initial comment of the workload mix, I\u0026rsquo;d say that interactive should have a few more very short point lookups to stress compilation times and give a higher absolute score of queries per second.\nAdjustments to the mix will depend on what we find out about scaling. As with SNB, it is likely that the workload will shift a little, so this result might not be comparable with future ones.\nIn the next SPB article, we will look closer at performance dynamics and choke points and will have an initial impression on scaling the workload.\n","permalink":"https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/","tags":["spb","test run"],"title":"Making Semantic Publishing Execution Rules"},{"categories":null,"contents":"The LDBC consortium are pleased to announce its fifth Technical User\nCommunity (TUC) meeting.\nThis will be a one-day event at the National Hellenic Research Institute\nin Athens, Greece on Friday November 14, 2014.\nAgenda 10:30 - 11:00 Coffee Break\n11:00 - 11:10 Peter Boncz (VUA) Welcome \u0026amp; LDBC project status update (Presentation)\n11:10 - 11:25 Venelin Kotsev (ONTO) Semantic Publishing Benchmark:Short Presentation of SPB and Status\nFeedback \u0026amp; Roadmap for SPB \u0026amp; OWLIM (Presentation)\n11:25 - 11:30 Orri Erling (OGL) Status, Feedback \u0026amp; Roadmap for SPB \u0026amp; Virtuoso (Presentation)\n11:30 - 11:45 Alex Averbuch (NEO) Social Network Benchmark: Short Presentation of SNB and Status, Feedback \u0026amp; Roadmap for SNB \u0026amp; Neo4J (Presentation)\n11:45 - 12:00 Orri Erling (OGL) Status, Feedback \u0026amp; Roadmap for SNB \u0026amp; Virtuoso (Presentation)\n12:00 - 12:20 Arnau Prat (UPC) \u0026amp; Andrey Gubichev Status, Feedback \u0026amp; Roadmap for SNB Interactive \u0026amp; Sparksee (Presentation ) and Business Intelligence (Presentation)\n12:20 - 12:40 Tomer Sagi, \u0026ldquo;Experience with SNB and TitanDB at HP\u0026rdquo; (Presentation )\n12:40 - 13:00 Jakob Nelson, \u0026ldquo;graphbench.org on the SNB datagen\u0026rdquo;\n13:00 - 14:30 Lunch Break@Byzantine \u0026amp; Christian Museum (link)\n14:30 - 14:50 Olaf Hartig, \u0026ldquo;Integrating the Property Graph and RDF data models\u0026rdquo; (Presentation)\\\nDocuments: arxiv/1409.3288, arxiv/1406.3399\n14:50 - 15:10 Maria-Esther Vidal and Maribel Acosta, \u0026ldquo;Challenges to be addressed during Benchmarking SPARQL Federated Engines\u0026rdquo; (Presentation)\n15:10 - 15:30 Evaggelia Pitoura, \u0026ldquo;Historical Queries on Graphs\u0026rdquo; (Presentation)\n15:30 - 16:00 Coffee Break\n16:00 - 16:20 Manolis Terrovitis, Giannis Liagos, George Papastefanatos, \u0026ldquo;Efficient Identification of Implicit Facts in Incomplete OWL2-EL Knowledge Bases\u0026rdquo; (Presentation)\n16:20 - 16:40 Gunes Aluc, \u0026ldquo;WatDiv: How to Tune-up your RDF Data Management System\u0026rdquo; (Presentation)\n16:40 - 17:00 Giorgos Kollias, Yannis Smaragdakis, \u0026ldquo;Benchmarking 
@LogicBlox\u0026rdquo; (Presentation)\n17:00 - 17:15 Hassan Chafi, \u0026ldquo;Oracle Labs Graph Strategy\u0026rdquo;\n17:15 - 17:25 Yinglong Xia, \u0026ldquo;Property Graphs for Industry Solution at IBM\u0026rdquo; (Presentation)\n17:25 - 17:30 Arthur Keen, \u0026ldquo;Short Introduction to SPARQLcity\u0026rdquo;\n20:30 Dinner @ Konservokouti (link)\nGet a Taxi, and go to Ippokratous 148, Athens, Neapoli Exarheion\nLogistics The meeting will be held at the National Hellenic Research Foundation located in downtown Athens.\nTravel Athens, Greece\u0026rsquo;s capital city, is easily accessible by air. Travelers on flights to Athens will land at Athens Eleftherios Venizelos International Airport.\nTo arrive in the city center, you can take the metro from the airport (Line #3) and stop at either stop Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations. You can also take express Bus X95 and stop again at either Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations (the latter is the terminus for the bus).\nYou can also take a taxi from the airport that runs on a fixed price for the city center (45 euros). More information on how to move around in Athens from the airport can be found here: http://www.aia.gr/traveler/\n","permalink":"https://ldbcouncil.org/event/fifth-tuc-meeting/","tags":["TUC Meeting"],"title":"Fifth TUC Meeting"},{"categories":null,"contents":"The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies proposed by BBC that define numerous properties for content; they contain asll RDFS schema constructs and certain OWL ones.\nThe benchmark proposes a data generator that uses the ontologies provided by BBC and reference datasets (again provided by BBC) to produce a set of valid instances; it works with a predefined set of distributions derived from the reference datasets. In addition to these distributions, the data generator also models:\nclustering of creative works around certain entities from the reference datasets (e.g. the association of an entity with creative works would decay exponentially in time) correlations between entities - there will be creative works about two entities for a certain period in time, that way a history of interactions is also modelled (e.g. J. Biden and B. Obama are tagged in creative works for a continuous period in time) The driver proposed by the benchmark measures the performance of CRUD operations of a SPARQL endpoint by starting a number of concurrently running editorial and aggregation agents. The former executes a series of insert, update and delete operations, whereas the latter a set of construct, describe, and select queries on a SPARQL endpoint. The benchmark can access all SPARQL endpoints that support the SPARQL 1.1 protocol. Tests have been run on OWLIM and Virtuoso. Attempts were also made for Stardog.\nCurrently, the benchmark offers two workloads: a base version that consists of a mix of nine queries of different complexity that consider nearly all the features of SPARQL 1.1 query language including sorting, subqueries, limit, regular expressions and grouping. 
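As noted earlier, the test driver talks to the store purely over the SPARQL 1.1 protocol, which is why any conformant endpoint can be benchmarked. Purely as an illustrative aside (this is not code from the SPB driver), the sketch below shows the shape of such a request in Java; the endpoint URL and the query string are placeholders.

import java.net.URI;
import java.net.http.HttpClient;
import java.net.http.HttpRequest;
import java.net.http.HttpResponse;

// Minimal sketch of an agent issuing one query via the SPARQL 1.1 protocol (plain HTTP POST).
public class SparqlAgentSketch {
    public static void main(String[] args) throws Exception {
        String endpoint = "http://localhost:8890/sparql";        // placeholder endpoint
        String query = "SELECT ?s WHERE { ?s ?p ?o } LIMIT 10";  // placeholder query
        HttpRequest request = HttpRequest.newBuilder(URI.create(endpoint))
                .header("Content-Type", "application/sparql-query")
                .header("Accept", "application/sparql-results+json")
                .POST(HttpRequest.BodyPublishers.ofString(query))
                .build();
        long start = System.nanoTime();
        HttpResponse<String> response =
                HttpClient.newHttpClient().send(request, HttpResponse.BodyHandlers.ofString());
        long elapsedMs = (System.nanoTime() - start) / 1_000_000;
        // An aggregation agent would record the status and latency as part of the query log.
        System.out.println(response.statusCode() + " in " + elapsedMs + " ms");
    }
}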
The queries aim at checking different choke points relevant to query optimisation such as:\njoin ordering based on cardinality constraints - expressed by the different kinds of properties defined in the schema subselects that aggregate the query results that the optimiser should recognise and evaluate first optional and nested optional clauses where the optimiser is called to produce a plan where the execution of the optional triple patterns is performed last reasoning along the RDFS constructs (subclass, subproperty hierarchies, functional, object and transitive properties etc.) unions to be executed in parallel optionals that contain filter expressions that should be executed as early as possible in order to eliminate intermediate results ordering where the optimiser could consider the possibility to choose query plan(s) that facilitate the ordering of results handling of geo-spatial predicates full-text search optimisation asynchronous execution of the aggregate sub-queries use of distinct to choose the optimal query plan We give below Query 1 of the Semantic Publishing Benchmark.\nPREFIX bbcevent:\u0026lt;http://www.bbc.co.uk/ontologies/event/\u0026gt; PREFIX geo-pos:\u0026lt;http://www.w3.org/2003/01/geo/wgs84_pos#\u0026gt; PREFIX bbc:\u0026lt;http://www.bbc.co.uk/ontologies/bbc/\u0026gt; PREFIX time:\u0026lt;http://www.w3.org/2006/time#\u0026gt; PREFIX event:\u0026lt;http://purl.org/NET/c4dm/event.owl#\u0026gt; PREFIX music-ont:\u0026lt;http://purl.org/ontology/mo/\u0026gt; PREFIX rdf:\u0026lt;http://www.w3.org/1999/02/22-rdf-syntax-ns#\u0026gt; PREFIX foaf:\u0026lt;http://xmlns.com/foaf/0.1/\u0026gt; PREFIX provenance:\u0026lt;http://www.bbc.co.uk/ontologies/provenance/\u0026gt; PREFIX owl:\u0026lt;http://www.w3.org/2002/07/owl#\u0026gt; PREFIX cms:\u0026lt;http://www.bbc.co.uk/ontologies/cms/\u0026gt; PREFIX news:\u0026lt;http://www.bbc.co.uk/ontologies/news/\u0026gt; PREFIX cnews:\u0026lt;http://www.bbc.co.uk/ontologies/news/cnews/\u0026gt; PREFIX cconcepts:\u0026lt;http://www.bbc.co.uk/ontologies/coreconcepts/\u0026gt; PREFIX dbp-prop:\u0026lt;http://dbpedia.org/property/\u0026gt; PREFIX geonames:\u0026lt;http://sws.geonames.org/\u0026gt; PREFIX rdfs:\u0026lt;http://www.w3.org/2000/01/rdf-schema#\u0026gt; PREFIX domain:\u0026lt;http://www.bbc.co.uk/ontologies/domain/\u0026gt; PREFIX dbpedia:\u0026lt;http://dbpedia.org/resource/\u0026gt; PREFIX geo-ont:\u0026lt;http://www.geonames.org/ontology#\u0026gt; PREFIX bbc-pont:\u0026lt;http://purl.org/ontology/po/\u0026gt; PREFIX tagging:\u0026lt;http://www.bbc.co.uk/ontologies/tagging/\u0026gt; PREFIX sport:\u0026lt;http://www.bbc.co.uk/ontologies/sport/\u0026gt; PREFIX skosCore:\u0026lt;http://www.w3.org/2004/02/skos/core#\u0026gt; PREFIX dbp-ont:\u0026lt;http://dbpedia.org/ontology/\u0026gt; PREFIX xsd:\u0026lt;http://www.w3.org/2001/XMLSchema#\u0026gt; PREFIX core:\u0026lt;http://www.bbc.co.uk/ontologies/coreconcepts/\u0026gt; PREFIX curric:\u0026lt;http://www.bbc.co.uk/ontologies/curriculum/\u0026gt; PREFIX skos:\u0026lt;http://www.w3.org/2004/02/skos/core#\u0026gt; PREFIX cwork:\u0026lt;http://www.bbc.co.uk/ontologies/creativework/\u0026gt; PREFIX fb:\u0026lt;http://rdf.freebase.com/ns/\u0026gt; # Query Name : query1 # Query Description : # Retrieve creative works about thing t (or that mention t) # reasoning: rdfs:subClassOf, rdf:type # join ordering: cwork:dateModified rdf:type owl:FunctionalProperty # join ordering: cwork:dateCreated rdf:type owl:FunctionalProperty # Choke Points : # - join ordering based on cardinality of 
functional proerties cwork:dateCreated, cwork:dateModified # Optimizer should use an efficient cost evaluation method for choosing the optimal join tree # - A sub-select which aggregates results. Optimizer should recognize it and execute it first # - OPTIONAL and nested OPTIONAL clauses (treated by query optimizer as nested sub-queries) # Optimizer should decide to put optional triples on top of the join tree # (i.e. delay their execution to the last possible moment) because OPTIONALs are treated as a left join # - qiery optimizer has the chance to recognize the triple pattern : ?cWork a ?type . ?type rdfs:subClassOf cwork:CreativeWork # and eliminate first triple (?cwork a ?type .) since ?cwork is a cwork:CreativeWork​ CONSTRUCT { ?creativeWork a cwork:CreativeWork ; a ?type ; cwork:title ?title ; cwork:shortTitle ?shortTitle ; cwork:about ?about ; cwork:mentions ?mentions ; cwork:dateCreated ?created ; cwork:dateModified ?modified ; cwork:description ?description ; cwork:primaryFormat ?primaryFormat ; bbc:primaryContentOf ?webDocument . ?webDocument bbc:webDocumentType ?webDocType . ?about rdfs:label ?aboutLabel ; bbc:shortLabel ?aboutShortLabel ; bbc:preferredLabel ?aboutPreferredLabel . ?mentions rdfs:label ?mentionsLabel ; bbc:shortLabel ?mentionsShortLabel ; bbc:preferredLabel ?mentionsPreferredLabel . ?creativeWork cwork:thumbnail ?thumbnail . ?thumbnail a cwork:Thumbnail ; cwork:altText ?thumbnailAltText ; cwork:thumbnailType ?thumbnailType . } WHERE { { SELECT ?creativeWork WHERE { ?creativeWork {{{cwAboutOrMentions}}} {{{cwAboutOrMentionsUri}}} . ?creativeWork a cwork:CreativeWork ; cwork:dateModified ?modified . } ORDER BY DESC(?modified) LIMIT 10 } ?creativeWork a cwork:CreativeWork ; a ?type ; cwork:title ?title ; cwork:dateModified ?modified . OPTIONAL { ?creativeWork cwork:shortTitle ?shortTitle . } OPTIONAL { ?creativeWork cwork:description ?description . } OPTIONAL { ?creativeWork cwork:about ?about . OPTIONAL { ?about rdfs:label ?aboutLabel . } OPTIONAL { ?about bbc:shortLabel ?aboutShortLabel . } OPTIONAL { ?about bbc:preferredLabel ?aboutPreferredLabel . } } OPTIONAL { ?creativeWork cwork:mentions ?mentions . OPTIONAL { ?mentions rdfs:label ?mentionsLabel . } OPTIONAL { ?mentions bbc:shortLabel ?mentionsShortLabel . } OPTIONAL { ?mentions bbc:preferredLabel ?mentionsPreferredLabel . } } OPTIONAL { ?creativeWork cwork:dateCreated ?created . } OPTIONAL { ?creativeWork cwork:primaryFormat ?primaryFormat . } OPTIONAL { ?webDocument bbc:primaryContent ?creativeWork . OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } } OPTIONAL { ?creativeWork bbc:primaryContentOf ?webDocument . OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } } OPTIONAL { ?creativeWork cwork:thumbnail ?thumbnail . OPTIONAL { ?thumbnail cwork:altText ?thumbnailAltText . } OPTIONAL { ?thumbnail cwork:thumbnailType ?thumbnailType . } } } Listing 1. Semantic Publishing Benchmark: Query 1\nThe benchmark test driver is distributed as a jar file, but can also be built using an ant script. It is distributed with the BBC ontologies and reference datasets, the queries and update workloads discussed earlier and the configuration parameters for running the benchmark and for generating the data. 
It is organised in the following different phases: ontology loading and reference dataset loading, dataset generation and loading, warm up (where a series of aggregation queries are run for a predefined amount of time), benchmark where all queries (aggregation and editorial) are run, conformance checking (that allows one to check whether the employed RDF engine implements OWL reasoning) and finally cleanup that removes all the data from the repository. The benchmark provides a certain degree of freedom where each phase can run independently of the others.\nThe data generator uses an RDF repository to load ontologies and reference datasets; actually, any system that will be benchmarked should have those ontologies loaded. Any repository that will be used for the data generation should be set up with context indexing, and finally geo-spatial indexing, if available, to serve the spatial queries. The current version of the benchmark has been tested with Virtuoso and OWLIM.\nThe generator uses configuration files that must be configured appropriately to set the values regarding the dataset size to produce, the number of aggregation and editorial agents, the query time out etc. The distributions used by the data generator could also be edited. The benchmark is very simple to run (once the RDF repository used to store the ontologies and the reference datasets is set up, and the configuration files updated appropriately) using the command: java -jar semantic_publishing_benchmark-*.jar test.properties. The benchmark produces three kinds of files that contain (a) brief information about each executed query, the size of the returned result, and the execution time (semantic_publishing_benchmark_queries_brief.log), (b) the detailed log of each executed query and its result (semantic_publishing_benchmark_queries_detailed.log) (c) the benchmark results (semantic_publishing_benchmark_results.log ).\nBelow we give an example of a run of the benchmark for OWLIM-SE. The benchmark reports the number of edit operations (inserts, updates, and writes) and queries executed at the Nth second of a benchmark run. It also reports that total number of retrieval queries as well as the average number of queries executed per second.\nSeconds run : 600 Editorial: 0 agents 0 operations (0 CW Inserts, 0 CW Updates, 0 CW Deletions) 0.0000 average operations per second Aggregation: 8 agents 298 Q1 queries 267 Q2 queries 243 Q3 queries 291 Q4 queries 320 Q5 queries 286 Q6 queries 255 Q7 queries 274 Q8 queries 271 Q9 queries 2505 total retrieval queries 4.1750 average queries per second Listing 2. A snippet of semantic_publishing_benchmark_results.log\nWe run the benchmark under the following configuration: we used 8 aggregation agents for query execution and 4 data generator workers all running in parallel. The warm up period is 120 seconds during which a number of aggregation agents is executed to prepare the tested systems for query execution. Aggregation agents run for a period of 600 seconds, and queries timeout after 90 seconds. We used 10 sets of substitution parameters for each query. For data generation, ontologies and reference datasets are loaded in the OWLIM-SE repository. We used OWLIM-SE, Version 5.4.6287 with Sesame Version 2.6 and Tomcat Version 6. The results we obtained for the 10M, 100M and 1B triple datasets are given in the table below:\n#triples Q1 Q2 Q3 Q4 Q5 Q6 Q7 Q8 Q9 #queries avg. #q. per sec. 
10M 298 267 243 291 320 286 255 274 271 2505 41,750 100M 53 62 51 52 44 62 25 55 45 449 7,483 1B 34 29 22 24 25 29 0 29 28 220 3,667 ","permalink":"https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/","tags":["spb","sparql"],"title":"Getting Started With the Semantic Publishing Benchmark"},{"categories":null,"contents":"The Linked Data Benchmark Council (LDBC) mission is to design and maintain benchmarks for graph data management systems, and establish and enforce standards in running these benchmarks, and publish and arbitrate around the official benchmark results. The council and its https://ldbcouncil.org website just launched, and in its first 1.5 year of existence, most effort at LDBC has gone into investigating the needs of the field through interaction with the LDBC Technical User Community (next TUC meeting will be on October 5 in Athens) and indeed in designing benchmarks.\nSo, what makes a good benchmark design? Many talented people have paved our way in addressing this question and for relational database systems specifically the benchmarks produced by TPC have been very helpful in maturing relational database technology, and making it successful. Good benchmarks are relevant and representative (address important challenges encountered in practice), understandable , economical (implementable on simple hardware), fair (such as not to favor a particular product or approach), scalable, accepted by the community and public (e.g. all of its software is available in open source). This list stems from Jim Gray\u0026rsquo;s Benchmark Handbook. In this blogpost, I will share some thoughts on each of these aspects of good benchmark design.\nA very important aspect of benchmark development is making sure that the community accepts a certain benchmark, and starts using it. A benchmark without published results and therefore opportunity to compare results, remains irrelevant. A European FP7 project is a good place to start gathering a critical mass of support (and consensus, in the process) for a new benchmark from the core group of benchmark designers in the joint work performed by the consortium. Since in LDBC multiple commercial graph and RDF vendors are on the table (Neo Technologies, Openlink, Ontotext and Sparsity) a minimal consensus on fairness had to be established immediately. The Linked Data Benchmark Council itself is a noncommercial, neutral, entity which releases all its benchmark specifications, software, as well as many materials created during the design. LDBC has spent a lot of time engaging interested parties (mainly through its Technical User Community gatherings) as well as lining up additional organizations as members of the Linked Data Benchmark Council. There is, in other words, a strong non-technical, human factor in getting benchmarks accepted.\nThe need for understandability for me means that a database benchmark should consist of a limited number of queries and result metrics. Hence I find TPC-H with its 22 queries more understandable than TPC-DS with its 99, because after (quite some) study and experience it is possible to understand the underlying challnges of all queries in TPC-H. It may also be possible for TPC-DS but the amount of effort is just much larger. Understandable also means for me that a particular query should behave similarly, regardless of the query parameters. 
Often, a particular query needs to be executed many times, and in order not to play into the hands of simple query caching and also enlarge the access footprint of the workload, different query parameters should be used. However, parameters can strongly change the nature of a query but this is not desirable for the understandability of the workload. For instance, we know that TPC-H Q01 tests raw computation power, as its selection predicate eliminates almost nothing from the main fact table (LINEITEM), that it scans and aggregates into a small 4-tuple result. Using a selection parameter that would select only 0.1% of the data instead, would seriously change the nature of Q01, e.g. making it amendable to indexing. This stability of parameter bindings is an interesting challenge for the Social Network Benchmark (SNB) of LDBC which is not as uniform and uncorrelated as TPC-H. Addressing the challenge of obtaining parameter bindings that have similar execution characteristics will be the topic of a future blog post.\nThe economical aspect of benchmarking means that while rewarding high-end benchmark runs with higher scores, it is valuable if a meaningful run can also be done with small hardware. For this reason, it is good practice to use a performance-per-EURO (or $) metric, so small installations despite a lower absolute score can still do well on that metric. The economical aspect is right now hurting the (still) leading relational OLTP benchmark TPC-C. Its implementation rules are such that for higher reported rates of throughput, a higher number of warehouses (i.e. larger data size) is needed. In the current day and age of JIT-compiled machinecode SQL procedures and CPU-cache optimized main memory databases, the OLTP throughput numbers now obtainable on modern transactional systems like Hyper on even a single server (it reaches more than 100.000 transactions per second) are so high that they lead to petabyte storage requirements. Not only does this make TPC-C very expensive to run, just by the sheer amount of hardware needed according to the rules, but it also undermines it representativity, since OLTP data sizes encountered in the field are much smaller than OLAP data sizes and do not run in the petabytes.\nRepresentative benchmarks can be designed by studying or even directly using real workload information, e.g. query logs. A rigorous example of this is the DBpedia benchmark whose workload is based on the query logs of dbpedia.org. However, this SPARQL endpoint is a single public Virtuoso instance that has been configured to interrupt all long running queries, such as to ensure the service remains responsive to as many users as possible. As a result, it is only practical to run small lookup queries on this database service, so the query log only contained solely such light queries. As a consequence, the DBpedia benchmark only tests small SPARQL queries that stress simple B-tree lookups only (and not joins, aggregations, path expressions or inference) and poses almost no technical challenges for either query optimization or execution. The lesson, thus, is to balance representativity with relevance (see later).\nThe fact that a benchmark can be scaled in size favors the use of synthetic data (i.e. created by a data generator) because data generators can produce any desired quantity of data. I hereby note that in this day and age, data generators should be parallel. Single-threaded single-machine data generation just becomes unbearable even at terabyte scales. 
A criticism of synthetic data is that it may not be representative of real data, which e.g. tends to contain highly correlated data with skewed distributions. This may be addressed to a certain extent by injecting specific skew and correlations into synthetic data as well (but: which skew and which correlations?). An alternative is to use real data and somehow blow up or contract the data. This is the approach in the mentioned DBpedia benchmark, though such scaling will distort the original distributions and correlations. Scaling a benchmark is very useful to investigate the effect of data size on the metric, on individual queries, or even in micro-benchmark tests that are not part of the official query set. Typically OLTP database benchmarks have queries whose complexity is O(log(N)) of the data size N, whereas OLAP benchmarks have queries which are linear, O(N) or at most O(N.log(N)) \u0026ndash; otherwise executing the benchmark on large instances is infeasible. OLTP queries thus typically touch little data, in the order of log(N) tuples. In order not to measure fully cold query performance, OLTP benchmarks for that reason need a warmup phase with O(N/log(N)) queries in order to get the system into a representative state.\nNow, what makes a benchmark relevant? In LDBC we think that benchmarks should be designed such that crucial areas of functionality are highlighted, and in turn system architects are stimulated to innovate. Either to catch up with competitors and bring the performance and functionality in line with the state-of-the-art but even to innovate and address technical challenges for which until now no good solutions exist, but which can give a decisive performance advantage in the benchmark. Inversely stated, benchmark design can thus be a powerful tool to influence the industry, as a benchmark design may set the agendas for multiple commercial design teams and database architects around the globe. To structure this design process, LDBC introduces the notion of \u0026ldquo;choke points\u0026rdquo;: by which we mean problems that challenge current technology. These choke points are collected and described early in the LDBC design process, and the workloads developed later are scored in terms of their coverage of relevant choke points. In case of graph data querying, one of the choke points that is unique to the area is recursive Top-N query handling (e.g. shortest path queries). Another choke point that arises is the impact of correlations between attribute value of graph nodes (e.g. both employed by TUM) and the connectivity degree between nodes (the probability to be friends). The notion observed in practice is that people who are direct colleagues, often are in each others friend network. A query that selects people in a social graph that work for the same company, and then does a friendship traversal, may get a bad intermediate result size estimates and therefore suboptimal query plan, if optimizers remain unaware of value/structure correlations. So this is an area of functionality that the Social Network Benchmark (SNB) by LDBC will test.\nTo illustrate what choke points are in more depth, we wrote a paper in the TPCTC 2013 conference that performs a post-mortem analysis of TPC-H and identified 28 such choke points. This table lists them all, grouped into six Choke Point (CP) areas (CP1 Agregation, CP2 Join, CP3 Locality, CP4 Calculations, CP5 Subqueries and CP6 Parallelism). 
The classification also shows CP coverage over each of the 22 TPC-H queries (black is high impact, white is no impact):\nI would recommend reading this paper to anyone who is interested in improving the TPC-H score of a relational database system, since this paper contains the collected experience of three database architects who have worked with TPC-H at length: Orri Erling (of Virtuoso), Thomas Neumann (Hyper,RDF-3X), and me (MonetDB,Vectorwise). Recently Orri Erling showed that this paper is not complete as he discovered one more choke-point area for TPC-H: Top-N pushdown. In a detailed blog entry, Orri shows how this technique can trivialize Q18; and this optimization can single handedly improve the overall TPC-score by 10-15%. This is also a lesson for LDBC: even though we design benchmarks with choke points in mind, the queries themselves may bring to light unforeseen opportunities and choke-points that may give rise to yet unknown innovations.\nLDBC has just published two benchmarks as Public Drafts, which essentially means that you are cordially invited to download and try out the RDF-focused Semantic Publishing Benchmark (SPB) and the more graph-focused Social Network Benchmark (SNB), and tell us what you think. Stay tuned for the coming detailed blog posts about these benchmarks, which will explain the graph and RDF processing choke-points that they test.\n(for more posts from Peter Boncz, see also Database Architects, a blog about data management challenges and techniques written by people who design and implement database systems)\n","permalink":"https://ldbcouncil.org/post/choke-point-based-benchmark-design/","tags":["database","benchmark","design"],"title":"Choke Point Based Benchmark Design"},{"categories":null,"contents":"The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23 2014, in announcing that two of the benchmarks that it has been developing since 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In case of LDBC, the release is staged: now the benchmark software just runs read-only queries. This will be expanded in a few weeks with a mix of read- and insert-queries. Also, query validation will be added later. Watch this blog for the announcements to come, as this will be a matter of weeks to add.\nThe Public Draft stage means that the initial software (data generator, query driver) work and an initial technical specification and documentation has been written. In other words, there is a testable version of the benchmark available for anyone who is interested. Public Draft status does not mean that the benchmark has been adopted yet, it rather means that LDBC has come closer to adopting them, but is now soliciting feedback from the users. The benchmarks will remain in this stage at least until October 6. On that date, LDBC is organizing its fifth Technical User Community meeting. One of the themes for that meeting is collecting user feedback on the Public Drafts; which input will be used to either further evolve the benchmarks, or adopt them.\nYou can also see that we created a this new website and a new logo. This website is different from http://ldbc.eu that describes the EU project which kick-starts LDBC. The ldbcouncil.org is a website maintained by the Linked Data Benchmark Council legal entity, which will live on after the EU project stops (in less than a year). 
The Linked Data Benchmark Council is an independent, impartial, member-sustained organization dedicated to the creation of RDF and graph data management benchmarks and benchmark practices.\nIn the next weeks, you will see many contributors in LDBC post items on this blog. Some of these blog entries will be very technical, others not, but all aim to explain what LDBC is doing for RDF and graph benchmarking, and why.\n","permalink":"https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/","tags":["developer","industry"],"title":"New Website Online LDBC Benchmarks Reach Public Draft"},{"categories":null,"contents":"Social Network interaction is amongst the most natural and widely spread activities in the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, Social Networks are well understood from the point of view of the data involved and the interaction required by their actors. Thus, the concepts of friends of friends, or retweet are well established for the data attributes they represent, and queries such as “find the friend of a specified person who has long worked in a company in a specified country” are natural for the users and easy to understand from a functional point of view.\nFrom a totally different perspective, Social Networks are challenging technologically, being part of the Big Data arena, and require the execution of queries that involve complex relationship search and data traversal computations that turn out to be choke points for the data management solutions in the market.\nWith the objective of shaping a benchmark which is up to date as a use case, well understood by everybody and poses significant technological challenges, the LDBC consortium decided to create the Social Network Benchmark, SNB, which is eventually going to include three workloads: the Interactive, the Business Intelligence and the Analytical. Those workloads are going to share a unique synthetic data generation tool that will mimic the data managed by real Social Networks.\nThe SNB data generator created by LDBC is an evolution of the S3G2 data generator and can be found at the LDBC Github repository. The data generator is unique because it generates data that contains realistic distributions and correlations among variables that were not taken into consideration before. It also allows generating large datasets because it uses a Hadoop based implementation to compute the complex data generated. The SNB data generator has already been used in different situations like the ACM SIGMOD programming contest 2014.\nThe SNB presents the Interactive workload as first of a breed with the objective to resemble the queries that users may place to a Social Network portal. Those are a combination of read and write small queries that express the needs of a user who is interacting with her friends and connections through the Social Network. 
Queries like that explained above (Q12 in the workload) are examples that set up choke points like pattern recognition or full traversals.\nMore details will be given in blogs to follow both for the data generator as well as for the specific characteristics of the workloads allowing the users to obtain a first contact with the benchmarks.\n","permalink":"https://ldbcouncil.org/post/social-network-benchmark-goals/","tags":["snb","datagen","interactive","bi","graphalytics"],"title":"Social Network Benchmark Goals"},{"categories":null,"contents":"It is with great pleasure that we announce the new LDBC organisation site at www.ldbcouncil.org. The LDBC started as a European Community FP7 funded project with the objective to create, foster and become an industry reference for benchmarking RDF and Graph technologies. A period of more than one and a half years has led us to the creation of the first two workloads, the Semantic Publishing Benchmark and the Social Network Benchmark in its interactive workload, which you will find in the benchmarks menu on this site.\nThose benchmarks will allow all the actors in the RDF and Graph industry to know who is who and how the different technology players are reacting to the results of their competing industry companies. Thus, the users will have results to compare the technologies and vendors will have a clear idea of how their products evolve compared to other vendors, all with the objective to foster the technological growth of the RDF and Graph arena.\nWhile the main objective of LDBC is to create benchmarks, we know that we need a strong community to grow and evolve those benchmarks taking into consideration all the market and technology needs. With this objective, we have created a special section to engage all the interested community through a blog, forums to discuss interesting issues and a lot of information on benchmarking, including links to other benchmarks, pointers to interesting conferences and venues and all the publications on benchmarking RDF and Graph technologies.\nWe want to make sure that we all know what benchmarking and the LDBC effort means, both historically, and from the global needs perspective. To make sure that this is accomplished, we set up a section open to the public with in depth explanations of the history of industry benchmarking, LDBC and why our society needs such efforts globally.\nFinally, we want to invite you to our Fifth Technical Users Community (TUC) meeting to be held in Athens next Monday Oct. 6th 2014. This event will have as its main objective to allow for presentations on experiences with the two already released benchmarks, SNB and SPB. You’ll find updated information here.\nIn all, we expect that the LDBC organisation site engages all of you and that the growth of RDF and Graph technologies in the future is secured by the benchmarks fostered by us.\n","permalink":"https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/","tags":["ldbc"],"title":"Welcome to the New Industry Oriented LDBC Organisation for Benchmarking RDF and Graph Technologies"},{"categories":null,"contents":"Following the 1st International workshop on Benchmarking RDF Systems (BeRSys 2013) the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industrials can meet to discuss topics related to the performance of RDF systems. 
BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines - in the line of TPCTC series of workshops.The focus of the workshop is to expose and initiate discussions on best practices, different application needs and scenarios related to different aspects of RDF data management.\nMore at: http://events.sti2.at/bersys2014/\n","permalink":"https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/","tags":["workshop","cfp","benchmark","bersys"],"title":"2nd International Workshop on Benchmarking RDF Systems"},{"categories":null,"contents":"As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective to provide a realistic yet challenging workload, consisting of a social network and a set of queries. Both have to be realistic, easy to understand and easy to generate. This post has the objective to discuss the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 [1].\nOne of the most important components of a benchmark is the dataset. However, directly using real data in a benchmark is not always possible. On the one hand, it is difficult to find data with all the scaling characteristics the benchmark requires. On the other hand, collecting real data can be expensive or simply not possible due to privacy concerns.\nFor these reasons, LDBC-SNB provides DATAGEN which is the synthetic data generator responsible for generating the datasets for the three LDBC-SNB workloads: the Interactive, the Business Intelligence and the Analytical. DATAGEN has been carefully designed with the following goals in mind:\nRealism. The data generated by DATAGEN has to mimic the features of those found in a real social network. In DATAGEN, output attributes, cardinalities, correlations and distributions have been finely tuned to reproduce a real social network in each of its aspects. DATAGEN is aware of the data and link distributions found in a real social network such as Facebook [2]. Also, it uses real data from DBPedia, such as property dictionaries, which ensure that the content is realistic and correlated. Scalability. Since LDBC-SNB is targeting systems of different scales and budgets, DBGEN must be capable of generating datasets of different sizes, from a few Gigabytes to Terabytes. DATAGEN is implemented following the MapReduce paradigm, allowing for the generation of large datasets on commodity clusters. Determinism. DATAGEN is deterministic regardless of the number of cores/machines used to produce the data. This important feature guarantees that all Test Sponsors will face the same dataset, thus, making the comparisons between different systems fair and the benchmarks’ results reproducible. Usability. LDBC-SNB has been designed to have an affordable entry point. As such, DATAGEN has been severely influenced by this philosophy, and therefore it has been designed to be as easy to use as possible. Finally, the area of action of DATAGEN is not only limited to the scope of LDBC-SNB. Several researchers and practitioners are already using DATAGEN in a wide variety of situations. If you are interested on the internals and possibilities of DATAGEN, please visit its official repository (https://github.com/ldbc/ldbc_snb_datagen).\nReferences [1] Pham, Minh-Duc, Peter Boncz, and Orri Erling. \u0026ldquo;S3g2: A scalable structure-correlated social graph generator.\u0026rdquo; Selected Topics in Performance Evaluation and Benchmarking. 
Springer Berlin Heidelberg, 2013. 156-172.\n[2] Prat-Pérez, Arnau, and David Dominguez-Sal. \u0026ldquo;How community-like is the structure of synthetically generated graphs?.\u0026rdquo; Proceedings of Workshop on GRAph Data management Experiences and Systems. ACM, 2014.\n","permalink":"https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/","tags":["datagen","social network","snb"],"title":"DATAGEN: Data Generation for the Social Network Benchmark"},{"categories":null,"contents":"In a previous blog post titled \u0026ldquo;Is SNB like Facebook\u0026rsquo;s LinkBench?\u0026rdquo;, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.\nDATAGEN DATAGEN is the data generator used by all the workloads of SNB. Here we introduced the design goals that drive the development of DATAGEN, which can be summarized as: Realism, Scalability, Determinism and Usability.\nDATAGEN produces datasets with the following schema, in terms of entities and their relations. Data generated represents a snapshot of the activity of a social network similar to real social networks such as Facebook, during a period of time. Data includes entities such as Persons, Organizations, and Places. The schema also models the way persons interact, by means of the friendship relations established with other persons, and the sharing of content such as messages (both textual and images), replies to messages and likes to messages. People form groups to talk about specific topics, which are represented as tags.\nFor the sake of credibility, data produced by DATAGEN has to be realistic. In this sense, data produced by DATAGEN not only has a realistic schema, but also pays attention to the following items:\nRealistic distributions. The degree distribution of friendship relationships has been modeled to reproduce that found in the Facebook graph. Also, other distributions such as the number of replies to a post, the number of persons per country or the popularity of a tag has been realistically modeled either using known distributions or data extracted from real sources such as Dbpedia.\nCorrelated attributes and relations. Attribute values are not chosen at random, but follow correlations. For instance, people from a specific country have a larger probability to have names typical from that country, to work on companies from that country or to study at universities of that country. Also, we DATAGEN implements a relationship creation process that tries to reproduce the homophily principle, that is, people with similar characteristics tend to be connected.\nDATAGEN is built on top of Hadoop, to generate datasets of different sizes. It works either on single node SMP machines or a cluster environment. DATAGEN supports different output formats targeting different systems. On the one hand, we have the CSV format, where each entity and relation is output into a different comma separated value file. On the other hand, it also supports the Turtle format for RDF systems.\nFinally, DATAGEN outputs two other things:\nUpdate Streams, which will be used in the future to implement updates in the workloads.\nSubstitution parameters, which are the parameters of the query instances the LDBC driver will issue. 
These are selected so that the query plans of the resulting query executions do not differ significantly.\nConfiguring and using DATAGEN is easy. Please visit this page for more information.\nLDBC driver SNB is designed to be as easy to adopt as possible. Therefore, SNB provides the LDBC execution driver, which is designed to automatically generate the benchmark workload and gather the benchmark results. It generates a stream of operations in conformance with a workload definition and executes those operations against some system using the provided database connector, with the substitution parameters produced by DATAGEN. During execution, the driver continuously measures performance metrics, and upon completion it generates a report of those metrics.\nIt is capable of generating parallel workloads (e.g. concurrent reads and writes), while respecting the configured operation mix and ensuring that ordering between dependent operations is maintained. For further details on how the driver achieves that, please visit the Documentation page.\nThe test sponsor (i.e. the implementer of the benchmark) has to provide a set of implemented interfaces that form a benchmark implementation to plug into the driver, and then the benchmark is executed automatically.\nGiven a workload consisting of a series of Operations, the test sponsor implements OperationHandlers for them. An OperationHandler is responsible for executing instances of a specific operation (query) type. This is done by overriding the method executeOperation(), which receives an Operation instance as its input parameter and returns the result. From the Operation instance, the operation\u0026rsquo;s input parameters can be retrieved, as well as the database connection state.\nThe database connector is used to initialize, clean up and get the database connection state. The database connector must implement the Db interface, which consists of three methods: onInit(), onCleanup() and getConnectionState(). onInit() is called before the benchmark is executed, and is responsible for initializing the database and registering the different OperationHandlers. onCleanup() is called after the benchmark has completed. Any resources that need to be released should be released here.\nFinally, getConnectionState() returns an instance of DbConnectionState, which encapsulates any state that needs to be shared between OperationHandler instances. For instance, this state could contain the necessary classes used to execute a given query on the implementing system. A minimal sketch of these interfaces is given a little further below.\nA good example of how to implement the benchmark can be found here.\nWorkloads Currently, LDBC has only released the first draft of the Interactive workload, but the business intelligence and analytical workloads are in the works. Workloads are designed to mimic the different usage scenarios found in operating a real social network site, and each of them targets one or more types of systems. Each workload defines a set of queries and query mixes, designed to stress the systems under test in different choke-point areas, while being credible and realistic.\nThe Interactive workload reproduces the interaction between the users of the social network by including lookups and transactions that update small portions of the database. These queries are designed to be interactive and target systems capable of answering such queries with low latency for multiple concurrent users. 
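Returning to the driver interfaces described above, the following is a minimal, self-contained Java sketch of that architecture. It uses simplified stand-in types for Operation, DbConnectionState, OperationHandler and Db to illustrate how the pieces fit together; it is not the actual LDBC driver API, and the real method signatures may differ.

// Simplified stand-ins for the driver-side types described in the text above.
abstract class Operation { }                     // an operation (query) instance carrying its input parameters
abstract class DbConnectionState { }             // state shared between handlers, e.g. a client or connection pool
interface OperationHandler {
    Object executeOperation(Operation operation, DbConnectionState state) throws Exception;
}
abstract class Db {
    abstract void onInit(java.util.Map<String, String> properties) throws Exception; // connect, register handlers
    abstract void onCleanup() throws Exception;                                      // release any resources held
    abstract DbConnectionState getConnectionState();                                 // shared connection state
}

// Example: a handler for a "friends with a given first name" style of query.
class FriendsWithNameOperation extends Operation {
    final long personId;
    final String firstName;
    FriendsWithNameOperation(long personId, String firstName) { this.personId = personId; this.firstName = firstName; }
}
class FriendsWithNameHandler implements OperationHandler {
    public Object executeOperation(Operation operation, DbConnectionState state) {
        FriendsWithNameOperation op = (FriendsWithNameOperation) operation;
        // here the operation parameters would be turned into a query against the system under test
        return java.util.List.of();
    }
}

In the actual driver the registration of handlers happens in onInit() and the driver takes care of scheduling, measurement and reporting; the sketch only indicates where the code of a test sponsor plugs in.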
Examples of Interactive queries are, given a user, retrieving those friends with a specific name, or finding the most recent posts and comments created by your friends.\nThe Business Intelligence workload will represent the business intelligence analytics a social network company would like to perform on the social network, in order to take advantage of the data to discover new business opportunities. This workload will explore moderate portions of data from different entities, and will perform more complex and data-intensive operations compared to the Interactive ones.\nExamples of possible Business Intelligence queries could be finding trending topics in a country at a given moment, or looking for fraudulent “likers”.\nFinally, the Analytical workload will aim at exploring the characteristics of the underlying structure of the network. Shortest paths, community detection or centrality are representative queries of this workload, and will imply touching a vast amount of the dataset.\nFinal remarks This is just a quick overview of the SNB benchmark. For a more detailed description, do not hesitate to read the official SNB specification draft, and stay tuned to the LDBC blog for future blog posts detailing all of the SNB parts in depth.\n","permalink":"https://ldbcouncil.org/post/getting-started-with-snb/","tags":["snb","interactive","datagen"],"title":"Getting Started With SNB"},{"categories":null,"contents":"The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads: interactive, business intelligence and graph analytics. This post introduces the interactive workload.\nThe benchmark measures the speed of queries of medium complexity against a social network being constantly updated. The queries are scoped to a user\u0026rsquo;s social environment and potentially access data associated with the friends of a user and their friends.\nThis is representative of an operational application. It goes beyond OLTP (On Line Transaction Processing) by having substantially more complex queries touching much more data than the point lookups and short reports in TPC-C or TPC-E. The emphasis is on presenting a rich and timely view of a constantly changing environment.\nSNB Interactive gives end users and application developers a reference workload for comparing the relative merits of different technologies for graph data management. These range from dedicated graph databases to RDF stores and relational databases. There are graph serving benchmarks such as the Facebook LinkBench, but SNB Interactive goes well beyond this in richness of schema and queries.\nThe challenge to implementors is handling the user-facing logic of a social network in a single system as the scale increases. The present practice in large social networks is massive sharding and the use of different SQL and key-value stores for different aspects of the service. The SNB workload is not intended to replicate this situation but to look for ways forward, so that one system can keep up with transactions and offer users rich and varied insight into their environment. The present practice relies on massive precomputation, but SNB Interactive seeks more agility and ad hoc capability also on the operational side.\nThe dataset is scaled in buckets, with distinct scales for 10, 30, 100, 300GB and so forth. A 100GB dataset has approximately 500,000 simulated users with their connections and online history. 
This is a convenient low-end single-server size, while 500 million users is 100TB, which is a data-center scale requiring significant scale-out.\nThe metric is operations per minute at scale. Online benchmarks typically have a fixed ratio between throughput and dataset size. Here we depart from this, thus one can report arbitrarily high throughputs at any scale. This makes main-memory approaches feasible, which corresponds to present online practices. The benchmark makes transactions and queries on a simulated timeline of social interactions. The challenge for the system is to run this as fast as possible at the selected scale while providing fast and predictable response times. Throughput can be increased at the cost of latency, but here the system must satisfy response time criteria while running at the reported throughput.\nDifferent technologies can be used for implementing SNB Interactive. The workload is defined in natural language with sample implementations in SPARQL and Cypher. Other possibilities include SQL and graph database APIs.\nSNB Interactive is an example of LDBC\u0026rsquo;s choke-point driven design methodology, where we draw on the combined knowledge and experience of several database system architects for defining realistic, yet ambitious challenges whose solution will advance the state of the art.\nThe benchmark specification and associated tools are now offered for public feedback. The LDBC partners working on SNB Interactive will provide sample implementations of the workload on their systems, including Virtuoso, Neo4j and Sparsity. Specifics of availability and coverage may vary.\nSubsequent posts will address the workload in more detail.\n","permalink":"https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/","tags":["snb","interactive"],"title":"Introducing SNB Interactive, the LDBC Social Network Benchmark Online Workload"},{"categories":null,"contents":"In this post, I will discuss in some detail the rationale and goals of the design of the Social Network Benchmark (SNB) and explain how it relates to real social network data as in Facebook, and in particular Facebook\u0026rsquo;s own graph benchmark called LinkBench. We think SNB is the most intricate graph database benchmark to date (it\u0026rsquo;s also available in RDF!) and it has already made some waves. SNB recently received praise at the most important database systems conference, SIGMOD, in Snowbird after being used for this year\u0026rsquo;s ACM SIGMOD Programming Contest, which was about graph analytics.\nSNB is intended to provide the following value to different stakeholders:\nFor end users facing graph processing tasks, SNB provides a recognizable scenario against which it is possible to compare merits of different products and technologies. 
By covering a wide variety of scales and price points, SNB can serve as an aid to technology selection.\nFor vendors of graph database technology, SNB provides a checklist of features and performance characteristics that helps in product positioning and can serve to guide new development.\nFor researchers, both industrial and academic, the SNB dataset and workload provide interesting challenges in multiple technical areas, such as query optimization, (distributed) graph analysis and transactional throughput, and provide a way to objectively compare the effectiveness and efficiency of new and existing technology in these areas.\nI should clarify that even though the data model of SNB resembles Facebook (and we\u0026rsquo;re extending it to also look more like Twitter), the goal of SNB is not to advise Facebook or Twitter what systems to use; they don\u0026rsquo;t need LDBC for that. Rather, we take social network data as a model for the much broader graph data management problems that IT practitioners face. The particular characteristic of a graph data management problem is that the queries and analysis are not just about finding data by value, but about learning about the connection patterns between data. The scenario of the SNB, a social network, was chosen with the following goals in mind:\nthe benchmark scenario should be understandable to a large audience, and this audience should also understand the relevance of managing such data.\nthe scenario in the benchmark should cover the complete range of challenges relevant for graph data management, according to the benchmark scope.\nthe query challenges in it should be realistic in the sense that, though synthetic, similar data and workloads are encountered in practice.\nThe SNB is in fact three distinct benchmarks with a common dataset, since there are three different workloads. Each workload produces a single metric for performance at the given scale and a price/performance metric at the scale. The full disclosure further breaks down the composition of the metric into its constituent parts, e.g. single query execution times.\nInteractive Workload. The Interactive SNB workload is the first one we are releasing. It is defined in plain text, yet we have example implementations in Neo4j\u0026rsquo;s Cypher, SPARQL and SQL. The Interactive workload tests a system\u0026rsquo;s throughput with relatively simple queries with concurrent updates. The system under test (SUT) is expected to run in a steady state, providing durable storage with smooth response times. Inserts are typically small, affecting a few nodes at a time, e.g. the uploading of a post and its tags. Transactions may require serializability, e.g. verifying that something does not exist before committing the transaction (a small sketch of this pattern follows below). Reads do not typically require more than read committed isolation. One could call the Interactive Workload an OLTP workload, but while queries typically touch a small fraction of the database, this can still be up to hundreds of thousands of values (often the two-step neighborhood of a person in the social graph). Note that in order to support the read queries, there is a lot of liberty to create indexing structures or materialized views; however, such structures need to be maintained with regard to the continuous inserts that are also part of the workload. This workload is now in draft stage, which means that the data generator and driver software stack are ready and the purpose is to obtain user feedback, as well as to develop good system implementations. 
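To make the point about small transactional inserts concrete, here is a minimal JDBC-style sketch of the verify-that-it-does-not-exist-then-insert pattern mentioned above; the table and column names are invented for the example and are not taken from the SNB specification.

// Minimal sketch of a check-then-insert transaction, as described above.
// Table and column names are illustrative only.
import java.sql.*;

class CheckThenInsert {
    static void addLike(Connection con, long personId, long postId) throws SQLException {
        con.setAutoCommit(false);                              // one transaction for the check and the insert
        try (PreparedStatement check = con.prepareStatement(
                 "SELECT 1 FROM likes WHERE person_id = ? AND post_id = ?");
             PreparedStatement insert = con.prepareStatement(
                 "INSERT INTO likes (person_id, post_id, creation_date) VALUES (?, ?, CURRENT_TIMESTAMP)")) {
            check.setLong(1, personId);
            check.setLong(2, postId);
            try (ResultSet rs = check.executeQuery()) {
                if (!rs.next()) {                              // only insert if the like does not exist yet
                    insert.setLong(1, personId);
                    insert.setLong(2, postId);
                    insert.executeUpdate();
                }
            }
            con.commit();                                      // serializable isolation (or a unique constraint)
        } catch (SQLException e) {                             // is what makes the check race-free
            con.rollback();
            throw e;
        }
    }
}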
The first implementations of this workload are now running on Openlink Virtuoso, Neo4j and Sparsity Sparksee, and we are eager to see people try these, and optimize and involve these.\nBusiness Intelligence Workload. There is a first stab at this workload formulated in SPARQL, tested against Openlink Virtuoso. The BI workload consists of complex structured queries for analyzing online behavior of users for marketing purposes. The workload stresses query execution and optimization. Queries typically touch a large fraction of the data and do not require repeatable read. The queries will be concurrent with trickle load (not out yet). Unlike the interactive workload, the queries touch more data as the database grows.\nGraph Analytics Workload. This workload is not yet available. It will test the functionality and scalability of the SUT for graph analytics that typically cannot be expressed in a query language. As such it is the natural domain for graph programming frameworks like Giraph. The workload is still under development, but will consist of algorithms like PageRank, Clustering and Breadth First Search. The analytics is done on most of the data in the graph as a single operation. The analysis itself produces large intermediate results. The analysis is not expected to be transactional or to have isolation from possible concurrent updates.\nAll the SNB scenarios share a common scalable synthetic data set, generated by a state-of-the art data generator. We strongly believe in a single dataset that makes sense for all workloads, that is, the interactive and BI workloads will traverse data that has sensible PageRank outcomes, and graph clustering structure, etc. This is in contrast to LinkBench, released by the team of Facebook that manages the OLTP workload on the Facebook Graph, which closely tunes to the low-level MySQL query patterns Facebook sees, but whose graph structure does not attempt to be realistic beyond average out degree of the nodes (so, it makes no attempts to create realistic community patterns or correlations) . The authors of LinkBench may be right that the graph structure does not make a difference for simple insert/update/delete/lookup actions which LinkBench itself tests, but for the SNB queries in the Interactive and BI workloads this is not true. Note that Facebook\u0026rsquo;s IT infrastructure does not store all user data in MySQL and its modified memcached (\u0026quot;TAO\u0026quot;), some of it ends up in separate subsystems (using HDFS and HBase), which is outside of the scope of LinkBench. However, for queries like in the SNB Interactive and BI workloads it does matter how people are connected, and how the attribute values of connected people correlate. In fact, the SNB data generator is unique in that it generates a huge graph with correlations, where people who live together, have the same interests or work for the same company have greater chance to be connected, and people from Germany have mostly German names, etc. 
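As an illustration of the kind of correlation-aware generation described above, here is a small Java sketch in which the country of a person biases the dictionary from which a first name is drawn. The dictionaries and the 0.8 bias are invented for the example; DATAGEN itself draws its dictionaries from sources such as DBpedia.

// Illustration only: attribute values are not chosen uniformly at random, but biased by a
// correlated attribute (here: country -> first name). The dictionaries below are made up.
import java.util.*;

class CorrelatedNameSampler {
    private static final Map<String, List<String>> NAMES_BY_COUNTRY = Map.of(
            "Germany", List.of("Hans", "Karl", "Anna"),
            "Italy", List.of("Luca", "Giulia", "Marco"));
    private static final List<String> GLOBAL_NAMES = List.of("Alex", "Maria", "David");

    // With high probability pick a name correlated with the country, otherwise fall back to a
    // global dictionary, so the correlation is strong but not absolute.
    static String firstNameFor(String country, Random rnd) {
        List<String> local = NAMES_BY_COUNTRY.get(country);
        if (local != null && rnd.nextDouble() < 0.8) {
            return local.get(rnd.nextInt(local.size()));
        }
        return GLOBAL_NAMES.get(rnd.nextInt(GLOBAL_NAMES.size()));
    }

    public static void main(String[] args) {
        Random rnd = new Random(42);   // a fixed seed keeps the output deterministic, as DATAGEN requires
        System.out.println(firstNameFor("Germany", rnd));
    }
}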
Correlations frequently occur in practice and can strongly influence the quality of query optimization and execution; therefore, LDBC wants to test their effects on graph data management systems (the impact of correlation among values and structure on query optimization and execution is a \u0026ldquo;choke point\u0026rdquo; for graph data management systems where LDBC wants to stimulate innovation).\n","permalink":"https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/","tags":["developer","snb","interactive","bi","graphalytics"],"title":"Is SNB Like Facebooks LinkBench"},{"categories":null,"contents":"Synopsis: Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must be both credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation of what online systems in fact do. So, the workload mix must strike a balance between practice and presenting new challenges.\nIt is about to be showtime for LDBC. The initial installment of the LDBC Social Network Benchmark (SNB) is the full data generator, test driver, workload and reference implementation for the interactive workload. SNB will further acquire business intelligence and graph analytics workloads, but this post is about the interactive workload.\nAs part of finalizing the interactive workload, we need to determine precise mixes of the component queries and updates. We note that the interactive mix so far consists of very heavy queries. These touch, depending on the scale, upwards of a million entities in the database.\nNow, rendering a page view in a social network site does not touch millions of entities. The query that needs to be correct and up to date touches tens or hundreds of entities, e.g. posts or social connections for a single page impression. There are also statistical views like the count of people within so many steps or contact recommendations, but these are not real time and not recalculated each time they are shown.\nSo, LDBC SNB has a twofold task:\nIn order to be a credible interactive workload, it must in fact have the characteristics of one In order to stimulate progress it must have queries that are harder than those that go in routine page views but are still not database-wide analytics. Designing a workload presents specific challenges:\nThe workload must be realistic enough for users to identify with it. The workload must pose challenges and drive innovation in a useful direction. The component operations must all play a noticeable role in it. If the operation\u0026rsquo;s relative performance does not affect the score, why is it in the workload? The interactive mix now has 14 queries that are interesting from a query optimization and execution viewpoint but touch millions of entities. This is not what drives page impressions in online sites. Many users of GDB and RDF are about online sites, so this aspect must not be ignored.\nVery roughly, the choke points (technical challenges) of SNB Interactive are as follows:\nRandom access - Traversing between people and content makes large numbers of random lookups. These can be variously parallelized and/or vectored. Query optimization must produce right plans - The primary point is join order and join type. Index vs. hash based joins have very different performance properties and the right choice depends on correctly guessing the number of rows and of distinct keys on either side of the join. 
When doing updates and lookups, the execution plan is obvious, but there the choke point is the scheduling of large numbers of short operations. Many queries have aggregation, many have distinct, all have result ordering and a limit on result count. The diverse interactions of these operators produce optimization opportunities. Dreaming up a scenario and workload is not enough for a benchmark. There must also be a strong indication that the job is do-able and plausible in the scenario.\nIn online benchmarks different operations have different frequencies and the operations are repeated large numbers of times. There is a notion of steady state, so that the reported result represents a level of performance a system can sustain indefinitely.\nA key part of the workload definition is the workload mix, i.e. the relative frequencies of the operations. This in fact decides what the benchmark measures.\nThe other aspect is the metric, typically some variation on operations per unit of time.\nAll these are interrelated. Here we can take clicks per second as a metric, which is easy to understand. We wish to avoid the pitfall of TPC-C, which ties the metric to a data size, so that for a high metric one must have a correspondingly larger database. This rule makes memory-only implementations unworkable in practice, while in reality many online systems in fact run from memory. So, here we scale in buckets, like in TPC-H, but we still have an online workload. The scenario of the benchmark has its own timeline, here called simulation time. A benchmark run produces events in the simulation time but takes place in real time. This defines an acceleration ratio. For example, we could say that a system does 1000 operations per second at 300G scale, with an acceleration of 7x, i.e. 7 hours worth of simulation time are done in one hour of real time. A metric of this form is directly understandable for sizing a system, as long as the workload mix is realistic. We note that online sites are usually provisioned so that servers do not run anywhere near their peak throughput at a busy time.\nSo how to define the actual mix? By measuring. But measuring requires a reference implementation that is generally up to date with the database science of the time and where the individual workload pieces are implemented in a reasonable manner, so no bad query plans or bad schema design. For the reference implementation, we use the Virtuoso column store in SQL.\nBut SQL is not graphy! Why not SPARQL? Because SPARQL has diverse fixed overheads and this is not an RDF-only workload. We do not want SPARQL overheads to bias the metric; we just want an implementation where we know exactly what goes on and how it works, with control of physical data placement, so we know there are no obvious stupidities in any of this. SPARQL will come. Anyway, as said elsewhere, we believe that SPARQL will outgrow its overheads, at which point SQL or SPARQL is a matter of esthetic preference. For now, it is SQL and all we want is transparency into the metal.\nHaving this, we peg the operation mix to the update stream generated by the data generator. At the 30G scale, there are 3.5M new posts/replies per month of simulation time. For each such event, a query mix will be run, so as to establish a realistic read/write ratio. The query mix will have fractional queries, for example 0.2 friend recommendations per new post, but that is not a problem, since we run large numbers of these and at the end of the run can check that the ratios of counts are as expected (a small worked example follows below). 
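As a back-of-the-envelope illustration of how the pegged mix and the acceleration ratio relate, the following snippet uses only the example figures quoted above (and assumes a 30-day month for the arithmetic):

// Worked example of pegging the mix to the update stream and of the acceleration ratio,
// using only the example figures quoted in the text above (30-day month assumed).
class MixArithmetic {
    public static void main(String[] args) {
        long newPostsPerSimMonth = 3_500_000;    // 30G scale: new posts/replies per month of simulation time
        double friendRecsPerPost = 0.2;          // fractional frequency: friend recommendations per new post
        double friendRecsPerSimMonth = newPostsPerSimMonth * friendRecsPerPost;   // 700,000
        double accelerationRatio = 7.0;          // 7 hours of simulation time per hour of real time
        double realHoursPerSimMonth = (30 * 24) / accelerationRatio;              // ~103 real hours per simulated month
        System.out.println(friendRecsPerSimMonth + " friend recommendations per simulated month");
        System.out.println(realHoursPerSimMonth + " real hours to play back one simulated month");
    }
}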
Next, we run this as fast as it will go on the test system. Then we adjust the ratio of short and long queries to meet two objectives:\nShort queries should collectively be about 45% of the CPU load. Updates will be under 5%. Long queries will take up the rest. For long queries, we further tune the relative frequencies so that each represents a roughly equal slice of the time. Having a query that does not influence the metric is useless, so each gets enough showtime to have an impact, but by their nature some are longer than others. The reason why short queries should have a large slice is the fact that this is so in real interactive systems. The reason why long queries are important is driving innovation. Like this we get both scheduling (short lookup/update) and optimization choke points covered. As a bonus, we make the mix so that we get a high metric, so many clicks per second, since this is what the operator of an online site wants.\nThere is a further catch: different scales have different degrees of the friends graph and this will have a different influence on different queries. To see whether this twists the metric out of shape we must experiment. For example, one must not have logarithmic and linear complexity queries in the same mix, as BSBM for example has. So this is to be kept in mind as we proceed.\nIn the next post we will look at the actual mix and execution times on the test system.\n","permalink":"https://ldbcouncil.org/post/making-it-interactive/","tags":["snb","benchmarking","tpc","sparql","interactive"],"title":"Making It Interactive"},{"categories":null,"contents":"In previous posts (this and this) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datasets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.\nGetting and Configuring Hadoop DATAGEN runs on top of hadoop 1.2.1 in order to be scalable. You can download it from here. Open a console and type the following commands to decompress hadoop into the /home/user folder:\n$ cd /home/user $ tar xvfz hadoop-1.2.1.tar.gz For simplicity, in this tutorial we will run DATAGEN in standalone mode, that is, only one machine will be used, using only one thread at a time to run the mappers and reducers. This is the default configuration, and therefore nothing else needs to be done to configure it. For other configurations, such as Pseudo-Distributed (multiple threads on a single node) or Distributed (a cluster of machines), visit the LDBC DATAGEN wiki.\nGetting and configuring DATAGEN Before downloading DATAGEN, be sure to fulfill the following requirements:\nLinux based machine java 1.6 or greater python 2.7.X maven 3 After configuring hadoop, now is the time to get DATAGEN from the LDBC-SNB official repositories. Always download the latest release, which at this time is v0.1.2. The releases page can be found here. Again, decompress the downloaded file with the following commands:\n$ cd /home/user $ tar xvfz ldbc_snb_datagen-0.1.2.tar.gz This will create a folder called “ldbc_snb_datagen-0.1.2”.\nDATAGEN provides run.sh, a script to automate the compilation and execution of DATAGEN. 
It needs to be configured for your environment, so open it and set the two variables at the top of the script to the corresponding paths.\nHADOOP_HOME=/home/user/hadoop-1.2.1 LDBC_SNB_DATAGEN_HOME=/home/user/ldbc_snb_datagen HADOOP_HOME points to the path where hadoop-1.2.1 is installed, while LDBC_SNB_DATAGEN_HOME points to where DATAGEN is installed. Change these variables to the appropriate values. Now, we can execute the run.sh script to compile and run DATAGEN using the default parameters. Type the following commands:\n$ cd /home/user/ldbc_snb_datagen-0.1.2 $ ./run.sh This will run DATAGEN, and two folders will be created in the same directory: social_network, containing the scale factor 1 dataset as uncompressed csv files, and substitution_parameters, containing the substitution parameters needed by the driver to execute the benchmark.\nChanging the generated dataset The characteristics of the dataset to be generated are specified in the params.ini file. By default, this file has the following content:\nscaleFactor:1 compressed:false serializer:csv numThreads:1 The following is the list of options and their default values supported by DATAGEN:\nOption Default value Description scaleFactor 1 \u0026ldquo;The scale factor of the data to generate. Possible values are: 1, 3, 10, 30, 100, 300 and 1000\u0026rdquo; serializer csv \u0026ldquo;The format of the output data. Options are: csv, csv_merge_foreign, ttl\u0026rdquo; compressed FALSE Specifies to compress the output data in gzip. outputDir ./ Specifies the folder to output the data. updateStreams FALSE \u0026ldquo;Specifies to generate the update streams of the network. If set to false, then the update portion of the network is output as static\u0026rdquo; numThreads 1 Sets the number of threads to use. Only works for pseudo-distributed mode. For instance, a possible params.ini file could be the following:\nscaleFactor:30 serializer:ttl compressed:true updateStreams:false outputDir:/home/user/output numThreads:4 For those not interested in generating a dataset for a given predefined scale factor, but for other applications, the following parameters can be specified (they need to be specified all together):\nOption Default value Description numPersons - The number of persons to generate numYears - The number of years of activity startYear - The start year of the simulation. The following is an example of another possible params.ini file:\nnumPersons:100000 numYears:3 startYear:2010 serializer:csv_merge_foreign compressed:false updateStreams:true outputDir:/home/user/output numThreads:4 For more information about the schema of the generated data, the different scale factors and serializers, please visit the wiki page of DATAGEN at GitHub!\n","permalink":"https://ldbcouncil.org/post/snb-data-generator-getting-started/","tags":["datagen","snb","social network"],"title":"SNB Data Generator - Getting Started"},{"categories":null,"contents":"Note: consider this post as a continuation of the \u0026ldquo;Making it interactive\u0026rdquo; post by Orri Erling.\nI have now completed the Virtuoso TPC-H work, including scale out. Optimization possibilities extend to infinity, but the present level is good enough. TPC-H is the classic of all analytics benchmarks and is difficult enough; I have extensive commentary on this on my blog (In Hoc Signo Vinces series), including experimental results. This is, as it were, the cornerstone of the true science. This is, however, not the totality of it. 
From the LDBC angle, we might liken this to the last camp before attempting a mountain peak.\nSo, we may now seriously turn to graph analytics. The project has enough left to run in order to get a good BI and graph analytics workload. In LDBC in general, as in the following, BI or business intelligence means complex analytical queries. Graph analytics means graph algorithms that are typically done in graph programming frameworks or libraries.\nThe BI part is like TPC-H, except for adding the following challenges:\nJoins of derived tables with group by, e.g. comparing popularity of items on consecutive time periods.\nTransitive dimensions - A geographical or tag hierarchy can be seen as a dimension table. To get the star schema plan with the selective hash join, the count of the transitive traversal of the hierarchy (hash build side) must be correctly guessed.\nTransitivity in fact table, i.e. average length of reply thread. There the cost model must figure that the reply link is much too high cardinality for hash build side, besides a transitive operation is not a good candidate for a build in multiple passes, hence the plan will have to be by index.\nGraph traversal with condition on end point and navigation step. The hierarchical dimensions and reply threads are in fact trees, the social graph is not. Again the system must know some properties of connectedness (in/out degree, count of vertices) to guess a traversal fanout. This dictates the join type in the step (hash or index). An example is a transitive closure with steps satisfying a condition, e.g. all connected persons have a specific clearance.\nRunning one query with parameters from different buckets, implying different best plan.\nData correlations, e.g. high selectivity arising from two interests seldom occurring together, in places where the correct estimation makes the difference between a good and a bad plan.\nLarge intermediate results stored in tables, as in materializing complex summaries of data for use in follow up queries.\nMore unions and outer joins.\nThe idea is to cover the base competences the world has come to expect and to build in challenges to last another 10-15 years.\nFor rules and metric, we can use the TPC-H or TPC-DS ones as a template. The schema may differ from an implementation of the interactive workload, as these things would normally run on different systems anyway. As another activity that is not directly LDBC, I will do a merge of SNB and Open Street Map. The geolocated things (persons, posts) will get real coordinates from their vicinity and diverse geo analytics will become possible. This is of some significant interest to Geoknow, another FP7 where OpenLink is participating.\nDoing the BI mix and even optimizing the interactive part involves some redoing of the present support for transitivity in Virtuoso. The partitioned group by with some custom aggregates is the right tool for the job, with all parallelization, scale-out, etc ready. You see, TPC-H is very useful also in places one does not immediately associate with it.\nAs a matter of fact, this becomes a BSP (bulk synchronous processing) control structure. Run any number of steps, each item produces results/effects scattered across partitions. The output of the previous is the input of the next. We might say BSP is an attractor or \u0026ldquo;Platonic\u0026rdquo; control structure to which certain paths inevitably lead. 
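For readers less familiar with the pattern, the following is a generic Java sketch of a BSP-style superstep loop, here doing a plain breadth-first expansion; it only illustrates the control structure discussed above and is not Virtuoso code.

// Generic sketch of a BSP-style superstep loop: each superstep consumes the frontier produced
// by the previous one and scatters new work until nothing new is produced (here: a plain BFS).
import java.util.*;

class BspSketch {
    static Set<Long> reachable(Map<Long, List<Long>> neighbors, long source) {
        Set<Long> visited = new HashSet<>();
        Set<Long> frontier = new HashSet<>(List.of(source));
        while (!frontier.isEmpty()) {               // one iteration = one superstep
            visited.addAll(frontier);
            Set<Long> next = new HashSet<>();       // the output of this step is the input of the next
            for (long v : frontier) {
                for (long w : neighbors.getOrDefault(v, List.of())) {
                    if (!visited.contains(w)) next.add(w);    // de-duplication acts like message combining
                }
            }
            frontier = next;
        }
        return visited;
    }
}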
Last year I did a BSP implementation in SQL, reading and writing tables and using transactions for serializable update of the border. This is possible but will not compete with a memory based framework and not enough of the optimization potential, e.g. message combining, is visible to the engine in this formulation. So, now we will get this right, as suggested.\nSo, the transitive derived table construct can have pluggable aggregations, e.g. remembering a path, a minimum length or such), reduction like a scalar-valued aggregate (min/max), different grouping sets like in a group by with cube or grouping sets, some group-by like reduction for message combining and so forth. If there is a gather phase that is not just the result of the scatter of the previous step, this can be expressed as an arbitrary database query, also cross partition in a scale-out setting.\nThe distributed/partitioned group by hash table will be a first class citizen, like a procedure scoped temporary table to facilitate returning multiple results and passing large data between multiple steps with different vertex operations, e.g. forward and backward in betweenness centrality.\nThis brings us to the graph analytics proper, which is often done in BSP style, e.g. Pregel, Giraph, Signal-Collect, some but not all Green-Marl applications. In fact, a Green-Marl back end for Virtuoso is conceivable, whether one will be made is a different matter.\nWith BSP in the database engine, a reference implementation of many standard algorithms is readily feasible and performant enough to do reasonable sizing for the workload and to have a metric. This could be edges or vertices per unit of time, across a mix of algorithms, for example. Some experimentation will be needed. The algorithms themselves may be had from the Green-Marl sample programs or other implementations. Among others, Oracle would presumably agree that this sort of functionality will in time migrate into core database. We will here have a go at this and along the way formulate some benchmark tasks for a graph analytics workload. Whenever feasible, this will derive from existing work such as graphbench.org but will be adapted to the SNB dataset.\nThe analytics part will be done with more community outreach than the interactive one. I will blog about the business questions, queries and choke points as we go through them. The interested may pitch in as the matter comes up.\n","permalink":"https://ldbcouncil.org/post/the-day-of-graph-analytics/","tags":["analytics","snb"],"title":"The Day of Graph Analytics"},{"categories":null,"contents":"During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC Semantic Publishing Benchmark (LDBC-SPB) as a part of our development and release process.\nFirst thing we’ve started using the LDBC-SPB for is to monitor the performance of our RDF Store when a new release is about to come out.\nInitially we’ve decided to fix some of the benchmark parameters :\nthe dataset size - 50 million triples (LDBC-SPB50) * benchmark warmup and benchmark run times - 60s and 600s respectively. * maximum number of Editorail Agents (E) : 2 (threads that will execute INSERT/UPDATE operations) * maximum number of Aggregation Agents (A) : 16 (threads that will execute SELECT operations) * generated data by the benchmark driver to be “freshly” deployed before each benchmark run - benchmark driver can be configured to generate the data and stop. We’re using that option and have a fresh copy of it put aside ready for each run. 
Having those parameters fixed, running LDBC-SPB is a straightforward task. The hardware we’re using for benchmarking is a machine with 2 Intel Xeon CPUs, 8 cores each, 256 GB of memory and SSD storage, running Linux. Another piece of hardware we’ve tested with is a regular desktop machine with an Intel i7, 32 GB of memory and HDD storage. During our experiments we have allowed a deviation in results of 5% to 10% because of the multi-threaded nature of the benchmark driver.\nWe’ve also decided to produce some benchmark results on Amazon’s EC2 Instances and compare them with the results we’ve had so far. Starting with an m3.2xlarge instance (8 vCPUs, 30GB of memory and 2x80GB SSD storage) on a 50M dataset, we’ve achieved more than 50% lower results than the ones on our own hardware. On a larger Amazon instance, c3.4xlarge (16 vCPUs, 30GB of memory and doubled SSD storage), we’ve achieved the same performance in terms of aggregation operations and even worse performance in terms of editorial operations, which we attribute to the fact that Amazon instances do not provide consistent performance all the time.\nThe following two charts show how OWLIM performs on different hardware and with different configurations. They also give an indication of Amazon’s capabilities compared to the results achieved on bare-metal hardware.\nFigure 1 : OWLIM Performance : 2 Amazon instances and 2 local machines. 16 aggregation and 2 editorial agents running simultaneously. Aggregation and editorial operations displayed here should be considered independently, i.e. even though the editorial operations graph shows higher results on the Amazon m3.2xlarge instance, values are normalized and refer to the corresponding type of operation.\nFigure 2 : OWLIM Performance : 2 Amazon instances and 2 local machines. 8 aggregation agents running simultaneously. Read-only mode.\nAnother thing that we’re using LDBC-SPB for is to monitor data loading performance. Loading of generated data can be done either manually, by creating some sort of script (e.g. using CURL), or by the benchmark driver itself, which will execute a standard POST request against a provided SPARQL endpoint. The benchmark\u0026rsquo;s data generator can be configured to produce chunks of generated data in various sizes, which can be used for experiments on load performance. Of course, load times of forward-chaining reasoners cannot be compared to those of backward-chaining ones, which is not the goal of the benchmark. Loading performance is not measured “officially” by LDBC-SPB (although the time for loading the data is reported), but it is a good thing to have when comparing RDF stores.\nAn additional and interesting feature of the SPB is the test for conformance to the OWL2-RL rule-set. It is a part of the LDBC-SPB benchmark and that phase is called checkConformance. The phase is run independently of the benchmark phase itself. It requires no data generation or loading except the initial set of ontologies. It tests the RDF store’s conformance to the rules in the OWL2-RL rule-set by executing a number of INSERT/ASK queries specific to each rule. 
The result of that phase is a list of all rules that have been passed or failed which is very useful for regression testing.\n","permalink":"https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/","tags":["ldbc","spb","rdf"],"title":"Using LDBC SPB to Find OWLIM Performance Issues"},{"categories":null,"contents":"The LDBC consortium are pleased to announce the fourth Technical User Community (TUC) meeting.\nThis will be a one-day event at CWI in Amsterdam on Thursday April 3, 2014.\nThe event will include:\nIntroduction to the objectives and progress of the LDBC project. Description of the progress of the benchmarks being evolved through Task Forces. Users explaining their use-cases and describing the limitations they have found in current technology. Industry discussions on the contents of the benchmarks. All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu\nFor presenters please limit your talks to just 15 minutes\nAgenda April 3rd\n10:00 Peter Boncz (VUA) – pptx, video: LDBC project status update\n10:20 Norbert Martinez (UPC) – pdf, video: Status update on the LDBC Social Network Benchmark (SNB) task force.\n10:50 Alexandru Iosup (TU Delft) – ppt, video: Towards Benchmarking Graph-Processing Platforms\n11:10 Mike Bryant (Kings College) – pptx, video: EHRI Project: Archival Integration with Neo4j\n11:30 coffee\n11:50 Thilo Muth (University of Magdeburg) – pptx, video: MetaProteomeAnalyzer: a graph database backed software for functional and taxonomic protein data analysis\n12:10 Davy Suvee (Janssen Pharmaceutica / Johnson \u0026amp; Johnson) – video: Euretos Brain - Experiences on using a graph database to analyse data stored as a scientific knowledge graph\n12:30 Yongming Luo (TU Eindhoven) – pdf, video: Regularities and dynamics in bisimulation reductions of big graphs\n12:50 Christopher Davis (TU Delft) – pdf, video: Enipedia - Enipedia is an active exploration into the applications of wikis and the semantic web for energy and industry issues\n13:10 - 14:30 lunch @ restaurant Polder\n14:30 SPB task force report\n15:00 Bastiaan Bijl (Sysunite) – pdf, video: Using a semantic approach for monitoring applications in large engineering projects\n15:20 Frans Knibbe (Geodan) – pptx, video: Benchmarks for geographical data\n15:40 Armando Stellato (University of Rome, Tor Vergata \u0026amp; UN Food and Agriculture Organization) – pptx, video: VocBench2.0, a Collaborative Environment for SKOS/SKOS-XL Management: scalability and (inter)operatibility challenges\n16:00 coffee\n16:20 Ralph Hodgson (TopQuadrant) – [pdf](https://pu b-3834 10a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachment s/5538064/5506367.pdf), video:Customer experiences in implementing SKOS-based vocabularymanagement systems\n16:40 Simon Jupp (European Bioinformatics Institute) – pdf, video: [Delivering RDF for the life science at the European Bioinformatics Institute: Six months in.]\n17:00 Jerven Bolleman (Swiss Institute of Bioinformatics) – pdf, video: Breakmarking UniProt RDF. 
SPARQL queries that make your database cry\u0026hellip;\n17:20 Rein van \u0026rsquo;t Veer (Digital Heritage Netherlands) – pptx, video Time and space for heritage\n17:40 end of meeting\n19:00 - 21:30 Social Dinner in restaurant Boom\nApril 4th\nLDBC plenary meeting for project partners.\nBenchmarking Graph-Processing Platforms: A Vision – Alexandru Iosup Logistics The meeting will be held at the Dutch national research institute for computer science and mathematics (CWI - Centrum voor Wiskunde en Informatica). It is located at Amsterdam Science Park:\n(A5 map)\nTravel Arriving \u0026amp; departing:\nAmsterdam has a well-functioning and nearby airport called Schiphol (AMS, www.schiphol.nl) that serves all main European carriers and also very many low-fare carriers.\nhttp://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane\nTrains (~5 per hour) are the most convenient means of transport between Schiphol airport and Amsterdam city center, the Centraal Station (17 minutes, a train every 15 minutes) \u0026ndash; which station you are also likely arriving at in case of an international train trip.\nFrom the Centraal Station in Amsterdam, there is a direct train (every half an hour, runs 11 minutes) to the Science Park station, which is walking distance of CWI. If you go from the Centraal Station to one of the hotels, you should take tram 9 \u0026ndash; it starts at Centraal Station (exception: for Hotel Casa 400, you should take the metro to Amstel station - any of the metros will do).\nTaxi is an alternative, though expensive. The price from Schiphol will be around 45 EUR to the CWI or another point in the city center (depending on traffic, the ride is 20-30 minutes).\nPublic transportation (tram, bus, metro) tickets for a single ride and 1-day (24 hour) passes can be purchased from the driver/conductor on trams and buses (cash only) and from vending machines in the metro stations.\nOnly the \u0026ldquo;disposable\u0026rdquo; cards are interesting for you as visitor.\nMulti-day (up to 7-days/168 hours) passes can only be purchased from the vending machines or from the ticket office opposite of Centraal Station.\nGetting Around: the fastest way to move in the city of Amsterdam generally is by bicycle. Consider renting such a device at your hotel. For getting from your hotel to the CWI, you can either take a taxi (expensive), have a long walk (35min), use public transportation (for NH Tropen/The Manor take bus 40 from Muiderpoort Station, for Hotel Casa 400 same bus 40 but from Amstel station, and for the Rembrandt Hotel it is tram 9 until Middenweg/Kruislaan and then bus 40), or indeed bike for 12 minutes.\nCars\nIn case you plan to arrive by car, please be aware that parking space in Amsterdam is scarce and hence very expensive. But, you can park your car on the \u0026ldquo;WCW\u0026rdquo; terrain where CWI is located. To enter the terrain by car, you have to get a ticket from the machine at the gate. To leave the terrain, again, you can get an exit ticket from the CWI reception.\nArriving at CWI: Once you arrive at CWI, you need to meet the reception, and tell them that you are attending the LDBC TUC meeting. 
Then, you\u0026rsquo;ll receive a visitor\u0026rsquo;s pass that allows you to enter our building.\nSocial Dinner\nThe social dinner will take place at 7pm on April 3 in Restaurant Boom (boometenendrinken.nl), Linneausstraat 63, Amsterdam.\n","permalink":"https://ldbcouncil.org/event/fourth-tuc-meeting/","tags":["TUC Meeting"],"title":"Fourth TUC meeting"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalsercim-angles-pb-14/","tags":[],"title":"Benchmarking Linked Open Data Management Systems"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-bookscrclinked-14-boncz-ep-14/","tags":[],"title":"Experiences with Virtuoso Cluster RDF Column Store"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confedbt-gubichev-014/","tags":[],"title":"Exploiting the query structure for efficient join ordering in SPARQL queries"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-gubichev-t-14/","tags":[],"title":"Graph Pattern Matching - Do We Have to Reinvent the Wheel?"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confwww-prat-perez-dl-14/","tags":[],"title":"High quality, scalable and parallel community detection for large real graphs"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-prat-d-14/","tags":[],"title":"How community-like is the structure of synthetically generated graphs?"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-conficde-gubichev-ab-14/","tags":[],"title":"How to generate query parameters in RDF benchmarks?"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confrweb-larriba-pey-md-14/","tags":[],"title":"Introduction to Graph Databases"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/ldbc-spc-specification/","tags":[],"title":"LDBC Semantic Publishing Benchmark (SPB) - v2.0"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalsercim-pham-b-14/","tags":[],"title":"MonetDB/RDF: Discovering and Exploiting the Emergent Schema of RDF Data"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-conftpctc-gubichev-b-14/","tags":[],"title":"Parameter Curation for Benchmark Queries"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalssigmod-angles-blf-0-enmkt-14/","tags":[],"title":"The Linked Data Benchmark Council: A graph and RDF industry benchmarking effort"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-martinez-bazan-d-14/","tags":[],"title":"Using semijoin programs to solve traversal queries in graph databases"},{"categories":null,"contents":"The LDBC consortium is pleased to announce the third Technical User Community (TUC) meeting!\nThis will be a one day event in London on the 19 November 2013 running in collaboration with the GraphConnect event (18/19 November). 
Registered TUC participants that would like a free pass to all of GraphConnect should register for GraphConnect using this following coupon code: LDBCTUC.\nThe TUC event will include:\nIntroduction to the objectives and progress of the LDBC project Description of the progress of the benchmarks being evolved through Task Forces Users explaining their use-cases and describing the limitations they have found in current technology Industry discussions on the contents of the benchmarks We will also be launching the LDBC non-profit organization, so anyone outside the EU project will be able to join as a member.\nWe will kick off new benchmark development task forces in the coming year, and talks at this coming TUC will play an important role in deciding the use case scenarios that will drive those benchmarks.\nAll users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu\nAgenda Logistics LDBC/TUC Background Social Network Benchmark Semantic Publishing Benchmark Agenda November 19th - Public TUC Meeting\n8:00 Breakfast and registration will open for Graph Connect/TUC at 8:00 am (Dexter House)\nshort LDBC presentation (Peter Boncz) during GraphConnect keynote by Emil Eifrem (09:00-09:30 Dexter House)\nNOTE: the TUC meeting is at the Tower Hotel, nearby Dexter House.\n10:00 TUC Meeting Opening (Peter Boncz)\n10:10 TUC Presentations (RDF Application Descriptions)\nJohan Hjerling (BBC): BBC Linked Data and the Semantic Publishing Benchmark Andreas Both (Unister): Ontology-driven applications in an e-commerce context Nuno Carvalho (Fujitsu Laboratories Europe): Fujitsu RDF use cases and benchmarking requirements Robina Clayphan (Europeana): Europeana and Open Data 11:30 Semantic Publishing Benchmark (SPB)\nVenelin Kotsev (Ontotext - LDBC): Semantic Publishing Benchmark Task Force Update and report 12:00-13:00 Lunch at the Graph Connect venue\nTalks During Lunch:\nPedro Furtado, Jorge Bernardino (Univ. 
Coimbra): KEYSTONE Cost Action 13:00 TUC Presentations (Graph Application Descriptions)\nMinqi Zhou / Weining Qian (East China Normal University): Elastic and realistic social media data generation Andrew Sherlock (Shapespace): Shapespace Use Case Sebastian Verheughe (Telenor): Real-time Resource Authorization 14:00 Social Network Benchmark (SNB)\nNorbert Martinez (UPC - LDBC): Social Network Benchmark Task Force Update and Report 14:30 Break\n14:45 TUC Presentations (Graph Analytics)\nKeith Houck (IBM): Benchmarking experiences with [System G Native Store (tentative title)] Abraham Bernstein (University of Zurich): Streams and Advanced Processing: Benchmarking RDF querying beyond the Standard SPARQL Triple Store Luis Ceze (University of Washington): Grappa and GraphBench Status Update 15:45 Break\n16:00 TUC Presentations* (Possible Future RDF Benchmarking Topics)*\nChristian-Emil Ore (Unit for Digital Documentation, University of Oslo, Norway): CIDOC-CRM Atanas Kiryakov (Ontotext): Large-scale Reasoning with a Complex Cultural Heritage Ontology (CIDOC CRM) Kostis Kyzirakos (National and Kapodistrian University of Athens / CWI): Geographica: A Benchmark for Geospatial RDF Stores Xavier Lopez (Oracle): W3C Property Graph progress Thomas Scharrenbach (University Zurich) PCKS: Benchmarking Semantic Flow Processing Systems 17:20 Meeting Conclusion (Josep Larriba Pey)\n17:30 End of TUC meeting\n19:00 Social dinner\nNovember 20th - Internal LDBC Meeting\n10:00 Start\n12:30 End of meeting\ncoffee and lunch provided Logistics Date\n19th November 2013\nLocation\nThe TUC meeting will be held in The Tower hotel (Google Maps link) approximately 4 minutes walk from the GraphConnect conference in London.\nGetting there\nFrom City Airport is the easiest: short ride on the DLR to Tower Gateway. Easy. From London Heathrow: first need to take the Heathrow Express to Paddington. Then take the Circle line to Tower Hill. See attached. LDBC/TUC Background Looking back, we have been working on two benchmarks for the past year: a Social Network Benchmark (SNB) and a Semantic Publishing Benchmark (SPB). While below we provide a short summary, all the details of the work on these benchmark development efforts can be found in the first yearly progress reports:\nLDBC_SNB_Report_Nov2013.pdf LDBC_SPB_Report_Nov2013.pdf A summary of these efforts can be read below or, for a more detailed account, please refer to: The Linked Data Benchmark Council: a Graph and RDF industry benchmarking effort. Annual reports about the progress, results, and future work of these two efforts will soon be available for download here, and will be discussed in depth at the TUC.\nSocial Network Benchmark The Social Network Benchmark (SNB) is designed for evaluating a broad range of technologies for tackling graph data management workloads. The systems targeted are quite broad: from graph, RDF, and relational database systems to Pregel-like graph compute frameworks. The social network scenario was chosen with the following goals in mind:\nit should be understandable, and the relevance of managing such data should be understandable it should cover the complete range of interesting challenges, according to the benchmark scope the queries should be realistic, i.e., similar data and workloads are encountered in practice SNB includes a data generator for creation of synthetic social network data with the following characteristics:\ndata schema is representative of real social networks data generated includes properties occurring in real data, e.g. 
irregular structure, structure/value correlations, power-law distributions the software generator is easy-to-use, configurable and scalable SNB is intended to cover a broad range of aspects of social network data management, and therefore includes three distinct workloads:\nInteractive Tests system throughput with relatively simple queries and concurrent updates; it is designed to test ACID features and scalability in an online operational setting. The targeted systems are expected to be those that offer transactional functionality. Business Intelligence Consists of complex structured queries for analyzing online behavior of users for marketing purposes; it is designed to stress query execution and optimization. The targeted systems are expected to be those that offer an abstract query language. Graph Analytics Tests the functionality and scalability of systems for graph analytics, which typically cannot be expressed in a query language. Analytics is performed on most/all of the data in the graph as a single operation and produces large intermediate results, and it is not expected to be transactional or need isolation. The targeted systems are graph compute frameworks, though database systems may compete, for example by using iterative implementations that repeatedly execute queries and keep intermediate results in temporary data structures. Semantic Publishing Benchmark The Semantic Publishing Benchmark (SPB) simulates the management and consumption of RDF metadata that describes media assets, or creative works.\nThe scenario is a media organization that maintains RDF descriptions of its catalogue of creative works \u0026ndash; input was provided by actual media organizations which make heavy use of RDF, including the BBC. The benchmark is designed to reflect a scenario where a large number of aggregation agents provide the heavy query workload, while at the same time a steady stream of creative work description management operations are in progress. This benchmark only targets RDF databases, which support at least basic forms of semantic inference. A tagging ontology is used to connect individual creative work descriptions to instances from reference datasets, e.g. sports, geographical, or political information. The data used will fall under the following categories: reference data, which is a combination of several Linked Open Data datasets, e.g. GeoNames and DBpedia; domain ontologies, that are specialist ontologies used to describe certain areas of expertise of the publisher, e.g., sport and education; publication asset ontologies, that describe the structure and form of the assets that are published, e.g., news stories, photos, video, audio, etc.; and tagging ontologies and the metadata, that links assets with reference/domain ontologies.\nThe data generator is initialized by using several ontologies and datasets. The instance data collected from these datasets are then used at several points during the execution of the benchmark. Data generation is performed by generating SPARQL fragments for create operations on creative works and executing them against the RDF database system.\nTwo separate workloads are modeled in SPB:\nEditorial: Simulates creating, updating and deleting creative work metadata descriptions. Media companies use both manual and semi-automated processes for efficiently and correctly managing asset descriptions, as well as annotating them with relevant instances from reference ontologies. 
Aggregation: Simulates the dynamic aggregation of content for consumption by the distribution pipelines (e.g. a web-site). The publishing activity is described as \u0026ldquo;dynamic\u0026rdquo;, because the content is not manually selected and arranged on, say, a web page. Instead, templates for pages are defined and the content is selected when a consumer accesses the page. Status of the Semantic Publishing Benchmark\n","permalink":"https://ldbcouncil.org/event/third-tuc-meeting/","tags":["TUC Meeting"],"title":"Third TUC Meeting"},{"categories":null,"contents":"The LDBC consortium are pleased to announce the second Technical User Community (TUC) meeting.\nThis will be a two day event in Munich on the 22/23rd April 2013.\nThe event will include:\nIntroduction to the objectives and progress of the LDBC project. Description of the progress of the benchmarks being evolved through Task Forces. Users explaining their use-cases and describing the limitations they have found in current technology. Industry discussions on the contents of the benchmarks. All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu\nAgenda Logistics Date Location Venue Getting to the TUM Campus from the Munich city center: Subway (U-Bahn) Getting to the TUM Campus from the Munich Airport Getting to the TUM Campus from Garching: U-Bahn Getting there Social Dinner Agenda April 22nd\n10:00 Registration.\n10:30 Josep Lluis Larriba Pey (UPC) - Welcome and Introduction.\n10:30 Peter Boncz (VUA): LDBC: goals and status\nSocial Network Use Cases (with discussion moderated by Josep Lluis Larriba Pey)\n11:00 Josep Lluis Larriba Pey (UPC): Social Network Benchmark Task Force\n11:30 Gustavo González (Mediapro): Graph-based User Modeling through Real-time Social Streams\n12:00 Klaus Großmann (Dshini): Neo4j at Dshini\n12:30 Lunch\nSemantic Publishing Use Cases (with discussion moderated by Barry Bishop)\n13:30 Barry Bishop (Ontotext): Semantic Publishing Benchmark Task Force\n14:00 Dave Rogers (BBC): Linked Data Platform at the BBC\n14:30 Edward Thomas (Wolters Kluwer): Semantic Publishing at Wolters Kluwer\n15:00 Coffee break\nProjects Related to LDBC\n15:30 Fabian Suchanek (MPI): \u0026ldquo;YAGO: A large knowledge base from Wikipedia and WordNet\u0026rdquo;\n16:00 Antonis Loziou (VUA): The OpenPHACTS approach to data integration\n16:30 Mirko Kämpf (Brox): \u0026ldquo;GeoKnow - Spatial Data Web project and Supply Chain Use Case\u0026rdquo;\n17:00 End of first day\n19:00 Social dinner\nApril 23rd\nIndustry \u0026amp; Hardware Aspects\n10:00 Xavier Lopez (Oracle): Graph Database Performance an Oracle Perspective.pdf\n10:30 Pedro Trancoso (University of Cyprus): \u0026ldquo;Benchmarking and computer architecture: the research side\u0026rdquo;\n11:00 Coffee break\nFuture Steps and TUC feedback session\n11:30 Peter Boncz (VUA) moderates: next steps in the Social Networking Task Force\n12:00 Barry Bishop (Ontotext) moderates: next steps in the Semantic Publishing Task Force\u0026quot;\n12:30 End of meeting\nLogistics Date 22nd and 23th April 2013\nLocation The TUC meeting will be held at LE009 room at LRZ (Leibniz-Rechenzentrum) located inside the TU Munich campus in Garching, Germany. 
The address is:\nLRZ (Leibniz-Rechenzentrum)\nBoltzmannstraße 1\n85748 Garching, Germany\nVenue To reach the campus, there are several options, including Taxi and Subway (U-Bahn)\nGetting to the TUM Campus from the Munich city center: Subway (U-Bahn) Take the U-bahn line U6 in the direction of Garching-Forschungszentrum, exit at the end station. Take the south exit to MI-Building and LRZ on the Garching Campus. The time of the journey from the city center is approx. 25-30 minutes. In order to get here from the City Center, you need the Munich XXL ticket that costs around 7.50 euros and covers all types of transportation for one day. The ticket has to be validated before the ride.\nGetting to the TUM Campus from the Munich Airport (except weekends) S-Bahn S8 line in the direction of (Hauptbahnhof) Munich Central Station until the third stop, Ismaning (approx. 13 minutes). From here Bus Nr. 230 until stop MI-Building on the Garching Campus. Alternatively: S1 line until Neufahrn, then with the Bus 690, which stops at Boltzmannstraße.\nS-Bahn lines S8 or S1 towards City Center until Marienplatz stop. Then change to U-bahn U6 line towards Garching-Forschungszentrum, exit at the last station. Take the south exit to MI-Building and LRZ.\nTaxi: fare is ca. 30-40 euros.\nFor cases 1 and 2, before the trip get the One-day Munich Airport ticket and validate it. It will cover all public transportation for that day.\nGetting to the TUM Campus from Garching: U-Bahn The city of Garching is located on the U6 line, one stop before the Garching-Forschungszentrum. In order to get from Garching to Garching-Forschungszentrum with the U-bahn, a special one-way ticket called Kurzstrecke (1.30 euros) can be purchased.\nFinding LRZ@TUM\nOpenStreetMap link\nGoogle Maps link\nGetting there Flying: Munich airport is located 28.5 km northeast of Munich. There are two ways to get from the airport to the city center: suburban train (S-bahn) and Taxi.\nS-Bahn: S-bahn lines S1 and S8 will get you from the Munich airport to the city center, stopping at both Munich Central Station (Hauptbahnhof) and Marienplatz. The One-day Airport-City ticket costs 11.20 euros and is valid for the entire Munich area public transportation during the day of purchase (the ticket needs to be validated before the journey). S-bahn leaves every 5-20 minutes and reaches the city center in approx. 
40 minutes.\nTaxi: taxi from the airport to the city center costs approximately 50 euros\nSocial Dinner The social dinner will take place at 7 pm on April 22 in Hofbräuhaus (second floor)\nAddress: Hofbräuhaus, Platzl 9, Munich\n","permalink":"https://ldbcouncil.org/event/second-tuc-meeting/","tags":["TUC Meeting"],"title":"Second TUC Meeting"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confamw-angles-br-13/","tags":[],"title":"A Practical Query Language for Graph DBs"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-angles-pdl-13/","tags":[],"title":"Benchmarking database systems for social network applications"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-ma-wqyxz-13/","tags":[],"title":"On benchmarking online social media analytical queries"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalscorrabs-1301-5121/","tags":[],"title":"Partitioning Graph Databases - A Quantitative Evaluation"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-conficde-pham-13/","tags":[],"title":"Self-organizing structured RDF in MonetDB"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-gubichev-bs-13/","tags":[],"title":"Sparqling Kleene: fast property paths in RDF-3X"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalsdbsk-boncz-fgl-013/","tags":[],"title":"The Linked Data Benchmark Council Project"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsigmod-cattuto-qpa-13/","tags":[],"title":"Time-varying social networks in a graph database: a Neo4j use case"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-conftpctc-boncz-ne-13/","tags":[],"title":"TPC-H Analyzed: Hidden Messages and Lessons Learned from an Influential Benchmark"},{"categories":null,"contents":"The LDBC consortium are pleased to announce the first Technical User Community (TUC) meeting. This will be a two day event in Barcelona on the 19/20th November 2012.\nSo far more than six commercial consumers of graph/RDF database technology have expressed an interest in attending the event and more are welcome. The proposed format of the event will include:\nIntroduction by the coordinator and technical director explaining the objectives of the LDBC project Invitation to users to explain their use-cases and describe the limitations they have found in current technology Brain-storming session for identifying trends and mapping out strategies to tackle existing choke-points The exact agenda will be published here as things get finalised before the event.\nAll users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu\nAgenda Slide Logistics Date Location Venue Getting there Agenda We will start at 9:00 on Monday for a full day, followed by half a day on Tuesday to allow attendees to travel home on the evening of the 20th.\nDay 1\n09:00 Welcome (Location: Aula Master)\n09:30 Project overview (Emphasis on task forces?) 
+ Questionnaire results?\n10:30 Coffee break\n11:00 User talks (To gather information for use cases?)\n13:00 Lunch\n14:00 User talks (cont.)\n15:00 Use case discussions (based on questionnaire results + consortium proposal + user talks).\n16:00 Task force proposals (consortium)\n17:00 Finish first day\n20:00 Social dinner\nDay 2\n10:00 Task force discussion (consortium + TUC)\n11:00 Coffee break\n11:30 Task force discussion (consortium + TUC)\n12:30 Summaries (Task forces, use cases, \u0026hellip;) and actions\n13:00 Lunch and farewell\n15:00 LDBC Internal meeting\nSlide Opening session:\nCWI – Peter Boncz – Objectives UPC – Larri – Questionnaire User stories:\nBBC – Jem Rayfield CA Technologies – Victor Muntés Connected Discovery (Open Phacts) – Bryn Williams-Jones Elsevier – Alan Yagoda ERA7 Bioinformatics – Eduardo Pareja Press Association – Jarred McGinnis RJLee – David Neuer Yale – Lec Maj Benchmark proposals:\nPublishing benchmark proposal – Ontotext – Barry Bishop Social Network Benchmark Proposal – UPC – Larri Logistics Date 19th and 20th November 2012\nLocation The TUC meeting will be held at “Aula Master” in the A3 building located inside the “Campus Nord de la UPC” in Barcelona. The address is:\nAula Master\nEdifici A3, Campus Nord UPC\nC. Jordi Girona, 1-3\n08034 Barcelona, Spain\nVenue To reach the campus, there are several options, including Taxi, Metro and Bus.\nFinding UPC\nFinding the meeting room\nGetting there Flying: Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this map of the airport). It is possible to buy packs of 10 train tickets, which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminals 1 and 2; however, it is more expensive than the train.\nRail: The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.\nBus: The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.\nTaxi: From the airport, you can take one of Barcelona\u0026rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €16 and trips to other destinations in the city cost approximately €18.\nTrain and bus: Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. 
You can find detailed information in the following link: http://www.barcelona-airport.com/eng/transport_eng.htm\nThe locations of the airport and the city centre\nBus map\n","permalink":"https://ldbcouncil.org/event/first-tuc-meeting/","tags":["TUC Meeting"],"title":"First TUC Meeting"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confcikm-gubichev-n-12/","tags":[],"title":"Fast approximation of Steiner trees in large graphs"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confedbt-tsialiamanis-sfcb-12/","tags":[],"title":"Heuristics-based query optimisation for SPARQL"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-confsemweb-phuoc-dpbef-12/","tags":[],"title":"Linked Stream Data Processing Engines: Facts and Figures"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-conftpctc-pham-be-12/","tags":[],"title":"S3G2: A Scalable Structure-Correlated Social Graph Generator"},{"categories":[],"contents":"","permalink":"https://ldbcouncil.org/publication/dblp-journalsdebu-erling-12/","tags":[],"title":"Virtuoso, a Hybrid RDBMS/Graph Column Store"},{"categories":null,"contents":"Redirecting\u0026hellip;\n","permalink":"https://ldbcouncil.org/events/","tags":null,"title":""},{"categories":null,"contents":"","permalink":"https://ldbcouncil.org/pages/page-name/","tags":null,"title":""},{"categories":null,"contents":"Redirecting\u0026hellip;\n","permalink":"https://ldbcouncil.org/posts/","tags":null,"title":""},{"categories":null,"contents":"Benefits The benefits of LDBC membership are:\nAccess to the internal LDBC information via its project management system and mailing lists, which include access to discussion documents, datasets, and draft benchmark specifications. Access to research resources at academic partners and connections to industry members. Right to membership of LDBC task forces and working groups. Currently, there are task forces on the Social Network Benchmark, Graphalytics, and FinBench, and working groups on graph schemas and query languages. Right to commission LDBC audits to produce official LDBC benchmark results. Note: Apart from conformance to membership agreement, including the Byelaws and the Fair Use Policy, becoming an LDBC member does not involve any further obligations. Members are not required to attend meetings, travel to events, or be involved in any task forces/working groups.\nAnnual membership fees Sponsor company/institution: 8,800 GBP Commercial company: 2,200 GBP Non-commercial institution: 1,100 GBP Individual Voting member (standard rate): 165 GBP Individual Voting member (reduced rate for students, etc.): 10 GBP Individual Associate member: no subscription fee Note: For non-sponsor organizations, there is a 2,000 GBP auditing fee, to be paid for each audit to LDBC. 
Sponsors are exempt from this additional fee.\nForms For the latest information on becoming an LDBC member, see the LDBC Membership – Joining and Renewing 2023 document.\nPlease fill out this form if you are an organization or individual applying to join LDBC:\nMembership form (both for individuals and organizations) Fill out one of these forms if you are just contributing to a project in the LDBC GitHub organization\nIndividual contributor license agreement (CLA) Organization contributor license agreement (CLA) In either case please email your completed form to info@ldbcouncil.org\nConstitutional documents See the constitutional documents page.\n","permalink":"https://ldbcouncil.org/becoming-a-member/","tags":null,"title":"Becoming a Member"},{"categories":null,"contents":"This page contains LDBC\u0026rsquo;s constitutional documents: its Articles of Association and Byelaws.\nCurrent versions Articles of Association (2023-03-30) Byelaws (v1.5, 2024-01-12) Old versions Articles of Association (2021-01-14) Byelaws (v1.4, 2023-05-02) Byelaws (v1.3, 2021-01-14) Byelaws (v1.2, 2020-07-28) Byelaws (v1.1, 2017-03-02) ","permalink":"https://ldbcouncil.org/constitutional-documents/","tags":null,"title":"Constitutional Documents"},{"categories":null,"contents":"If you are interested in joining our benchmark task forces, please reach out at info@ldbcouncil.org.\nLicensing Our benchmarks are licensed under the Apache Software License, Version 2.0 (license file, notice file).\nContributor License Agreement To contribute to the LDBC repositories, we ask you to sign a CLA or become an LDBC member. These options are available for both individuals and organizations.\n","permalink":"https://ldbcouncil.org/developer-community/","tags":null,"title":"Developer Community"},{"categories":null,"contents":" Group leader: Petra Selmer (Neo4j) Focus: Surveying existing graph query languages Group members Angela Bonifati (Lyon 1 University) Frank Celler (ArangoDB) Victor Lee (TigerGraph) Harsh Thakkar (Consultant OSTHUS GmBH) Jeffrey Lovitz (RedisGraph) Renzo Angles (Universidad de Talca) ","permalink":"https://ldbcouncil.org/gql-community/elwg/","tags":null,"title":"Existing Languages Working Group (ELWG)"},{"categories":null,"contents":" The text of this page is based on our Byelaws.\nLDBC Benchmarks® and LDBC Benchmark® Results LDBC expects all its members to conscientiously observe the provisions of this Fair Use Policy for LDBC Benchmarks. LDBC-approved auditors must bring this Fair Use Policy for LDBC Benchmarks to the attention of any prospective or actual Test Sponsor. The Board of Directors of LDBC is responsible for enforcing this Policy and any alleged violations should be notified to info@ldbcouncil.org.\nAn “LDBC Draft Benchmark®” is a benchmark specification and any associated tooling or datasets, which has been written by an LDBC Task Force or Working Group whose charter includes the goal of achieving adoption of that specification as an LDBC standard, in accordance with Article 33 of the Articles of Association of the Company, “Approval of Standards”. An “LDBC Benchmark®” is an LDBC Draft Benchmark once it has been adopted as an LDBC standard. 
A result of a performance test can be fairly described as an “LDBC Benchmark Result”, if the test\u0026mdash;which may be executed in several runs all of which use the same System Under Test (SUT)\u0026mdash;has been successfully audited by an LDBC-approved auditor, and the result is reported as part of an LDBC Benchmark Results set, so it can be interpreted in context. An audit can only be successful if the audited test uses a SUT which faithfully implements the mandatory features and chosen optional features of an LDBC Benchmark, completely exercises and generates results for all the mandatory requirements and chosen optional requirements of the LDBC Benchmark, and is conducted and audited in conformance with all the relevant provisions of the LDBC Byelaws, including the statement of Total Cost of Ownership for the SUT and the reporting of price/performance metrics, such that the reported results can legitimately be used to compare the price-weighted performance of two SUTs. “LDBC Benchmark Results” is a set of all the results of a successfully audited test. A single LDBC Benchmark Result must be reported as part of such a set. Any description or depiction of a specification that states or implies that it is an LDBC Draft Benchmark or an LDBC Benchmark when that is not the case is an infringement of LDBC’s trademark in the term “LDBC BENCHMARK”, which is registered in several major jurisdictions. The same trademark is infringed by any software which is described or promoted as being an implementation of an LDBC Draft Benchmark or LDBC Benchmark, but which does not faithfully implement the features of or does not support the mandatory requirements of the stated specification. The same trademark is infringed by any report or description of one or more performance test results which are not part of a set of LDBC Benchmark Results, or in any other way states or implies that the results are endorsed by or originate from LDBC. LDBC considers the use of that trademarked term with respect to performance test results solely in accordance with these Byelaws to be essential to the purpose and reputation of the Company and its benchmark standards. Reporting of LDBC Benchmark Results Once an auditor has approved a performance test result, including all required supporting documentation, as being successfully audited, then the Members Council and the Task Force responsible for the benchmark will be notified. The Board will have the results added to the LDBC web site as an LDBC Benchmark Results set according to the following procedure:\nLDBC members will receive notification of the result via email to their designated contacts within five business days of LDBC receiving the notification. Within five business days of this notice, the LDBC administrator will post the result on the LDBC web site under the rubric \u0026ldquo;LDBC Benchmark Results” unless the result is withdrawn by the Test Sponsor in the meantime. A result may be challenged and subsequently be withdrawn by the LDBC following a review process as described in Article 7.6. A result that is not challenged within 60 days of its publication will be automatically considered valid and may not be challenged after this time, and this fact will be recorded as part of the website posting of the result. 
Fair Use of the trademark LDBC BENCHMARK Any party wishing to avoid infringement of the trademarked term “LDBC BENCHMARK” should follow the following guidelines relating to its fair use.\nLDBC encourages use, derived use, study, descriptions, critiques of and suggestions for improvement of LDBC Draft Benchmarks and LDBC Benchmarks. Our benchmark specifications are open-source, and we always welcome new contributors and members. These guidelines are only intended to prevent false or confusing claims relating to performance test results that are intended to be used for product comparisons.\nIf your work is derived from an LDBC Draft or standard Benchmark, or is a partial implementation, or if you are using part of one of our standards for a non-benchmarking purpose, then we would expect you to give attribution, in line with our Creative Commons CC-BY 4.0 licence. We would also suggest that you make a statement, somewhere, somehow, that includes one of these phrases “This is not an LDBC Benchmark”, “This is not an implementation of an LDBC Benchmark” or “These are not LDBC Benchmark Results”. We would also suggest that you explain, however briefly, how your work is related to LDBC standards and how it varies from them. An example that illustrates these points: you might say something like this in a presentation:\n“We used the LDBC SNB benchmark as a starting point. This isn’t the official LDBC standard: we added four queries because of X, and we don’t attempt to deal with the ACID requirement. The test results aren’t audited, so we want to be clear that this is not an LDBC Benchmark test run, and these numbers are not LDBC Benchmark Results. If you look at this link on the slide I’m showing you can see all the details of how our work is derived from, and varies from, the SNB 2.0 spec.”\nOr you might say:\n“For this example of a GQL graph type we used the LDBC SNB data model. This is nothing to do with the actual LDBC benchmark specification: we just used their data model as a use-case for illustrating what a graph schema might look like. We took this from the SNB 2.0 spec.”\n","permalink":"https://ldbcouncil.org/benchmarks/fair-use-policies/","tags":null,"title":"Fair Use Policy for LDBC Benchmarks®"},{"categories":null,"contents":" Group leaders: Leonid Libkin (ENS Paris, University of Edinburgh), Paolo Guagliardo (University of Edinburgh) Focus: Establishing formal semantics for the upcoming GQL language ","permalink":"https://ldbcouncil.org/gql-community/fswg/","tags":null,"title":"Formal Semantics Working Group (FSWG)"},{"categories":null,"contents":"The Linked Data Benchmark Council (LDBC) is a non-profit organization aiming to define standard graph benchmarks to foster a community around graph processing technologies. 
LDBC consists of members from both industry and academia, including organizations and individuals.\nAn overview of our activities is summarized in a lightning talk at FOSDEM 2023\u0026rsquo;s HPC room (9 minutes):\nSee also our TPCTC 2023 paper and its slide deck.\nContact To learn more about LDBC, reach out at info@ldbcouncil.org.\nPost address First Floor, Two Chamberlain Square\nBirmingham\nB3 3AX\nUnited Kingdom\n","permalink":"https://ldbcouncil.org/introduction/","tags":null,"title":"Introduction"},{"categories":null,"contents":"Group leader: Alastair Green (JCC)\nActive members:\nKoji Annoura Michael Behrisch Stephen Cannan Alin Deutsch George Fletcher Thomas Friesendal Denise Gosnell Alastair Green Cole Greer Zhihui Guo Keith Hare Jan Hidders Longbin Lai Heng Lin Alessandro Mosca Stefan Plantikow Yuya Sasaki Ognjen Savkovic Michael Schmidt Dominik Tomaszuk Yang Xia Wenyuan Yu Tao Wang Dušan Živkovic and 15+ observers See the LEX work charter which details the group\u0026rsquo;s mission, motivation, and scope of work.\n","permalink":"https://ldbcouncil.org/gql-community/lex/","tags":null,"title":"LDBC Extended GQL Schema (LEX) working group"},{"categories":null,"contents":"The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as\nanti-fraud and risk control. It is maintained by the LDBC FinBench Task Force.\nThe benchmark has one workload, Transaction Workload, capturing an OLTP scenario with complex read queries that access the neighbourhood of a given node in the graph and write queries that continuously insert or delete data in the graph. Its data sets are available in the Google Drive.\nFor a brief overview, see the slides presented in the 16th TUC meeting. The Financial Benchmark\u0026rsquo;s specification can be found on arXiv.\nFinBench Audit Audit results There are no audited results yet.\nCommissioning audits For auditing requests, please reach out at info@ldbcouncil.org. Audits can only be commissioned by LDBC member companies by contracting any of the LDBC-certified auditors. Note that there is a 2,000 GBP auditing fee to be paid to the LDBC by non-sponsor company members. Sponsor companies are exempt from this.\nUse of audited results Fair use policies The LDBC Financial Benchmark is subject to the LDBC Fair Use Policies.\n","permalink":"https://ldbcouncil.org/benchmarks/finbench/","tags":null,"title":"LDBC Financial Benchmark (LDBC FinBench)"},{"categories":null,"contents":"LDBC\u0026rsquo;s working groups investigate research questions on graph query languages and language extensions for graphs.\nTheir work targeted the ISO/IEC SQL/PGQ language extension (released in June 2023) and the ISO/IEC GQL language (released in April 2024).\nLDBC has released open GQL language tools in May 2024.\nActive Working Groups LDBC Extended GQL Schema (LEX) working group Historical Working Groups Property Graph Schema Working Group Existing Languages Working Group Formal Semantics Working Group ","permalink":"https://ldbcouncil.org/gql-community/overview/","tags":null,"title":"LDBC Graph Query Working Groups"},{"categories":null,"contents":"The Graphalytics benchmark is an industrial-grade benchmark for graph analysis platforms such as Giraph, Spark GraphX, and GraphBLAS. 
It consists of six core algorithms, standard data sets, and reference outputs, enabling the objective comparison of graph analysis platforms.\nThe benchmark harness consists of a core component, which is extendable by a driver for each different platform implementation. The benchmark includes the following algorithms:\nbreadth-first search (BFS) PageRank (PR) weakly connected components (WCC) community detection using label propagation (CDLP) local clustering coefficient (LCC) single-source shortest paths (SSSP) The choice of these algorithms was carefully motivated, using the LDBC TUC and extensive literature surveys to ensure good coverage of scenarios. The standard data sets include both real and synthetic data sets, which are classified into intuitive “T-shirt” sizes (S, M, L, etc.).\nEach experiment set in Graphalytics consists of multiple platform runs (a platform executes an algorithm on a data set), and a diverse set of experiments is carried out to evaluate different performance characteristics of a system-under-test.\nAll completed benchmarks must go through a strict validation process to ensure the integrity of the performance results.\nThe development of Graphalytics is supported by many active vendors in the field of large-scale graph analytics. Currently, Graphalytics already facilitates benchmarks for a large number of graph analytics platforms, such as GraphBLAS, Giraph, GraphX, and PGX.D, allowing comparison of the state-of-the-art system performance of both community-driven and industrial-driven platforms. To get started, the details of the Graphalytics documentation and its software components are described below.\nDocuments and repositories Benchmark specification. The source code is stored in the ldbc_graphalytics_docs repository VLDB paper ldbc_graphalytics: Generic driver ldbc_graphalytics_platforms_umbra: Umbra implementation ldbc_graphalytics_platforms_graphblas: GraphBLAS implementation Graphalytics competition 2023 In 2023, we will hold a new round of the Graphalytics competition. See the LDBC Graphalytics Benchmark presentation for an introduction to the benchmark framework and the competition\u0026rsquo;s rules.\nArtifacts:\nbenchmark framework reference implementations data sets (data sets and expected results) are available on GitHub Rules Participation is free. There are no monetary prizes. Single-node and distributed implementations are allowed. Partial implementations (e.g. just small to mid-sized data sets and only a few algorithms) are allowed. Submissions should execute each algorithm-data set combination three times. From these, the arithmetic mean of the processing times is used for ranking. The results of the competition will be published on the LDBC website in the form of leaderboards, which rank them based on performance and price-performance (adjusted for the system price). There is a global leaderboard that includes all algorithms and scale factors. Additionally, there is a separate leaderboard for each scale (S, M, L, XL, 2XL+), algorithm and system category (CPU-based/GPU-based, single-node vs. distributed) for fine-grained comparison. Submissions are subject to code review and reproducibility attempts from the organizers. System prices should be reported following the TPC Pricing specification. Recommendations for submissions Submissions using modern hardware are welcome (GPUs, FPGAs, etc.). We encourage the use of cloud compute instances for running the benchmark (if possible). 
Important dates March 17: Competition is announced April 25: Confirmation of intent May 1: Submissions open June 25: Submissions close Data sets The Graphalytics data sets are compressed using zstd. The total size of the compressed archives is approx. 350GB. When decompressed, the data sets require approximately 1.5TB of disk space.\nFor detailed information on the data sets, see the table with their statistics.\nThe data sets are available in two locations:\nA public Cloudflare R2 bucket This is the primary source for the data sets and is kept up-to-date upon changes The links in the table below point to this bucket Shell script to download the data sets from Cloudflare R2 Download scripts for individual sizes: test graphs, sizes up to S, size M, size L, size XL, sizes 2XL+ CWI/SURFsara data repository Backup repository Shell script to download the data sets from SURFsara Note that some of the Graphalytics data sets were fixed in March 2023. Prior to this, they were incorrectly packaged or had missing/incorrect reference outputs for certain algorithms. If you are uncertain whether you have the correct versions, cross-check them against these MD5 checksums: datagen-9_4-fb, datagen-sf3k-fb, datagen-sf10k-fb, graph500-27, graph500-28, graph500-29, graph500-30.\ndata set #nodes #edges scale link size cit-Patents 3,774,768 16,518,947 XS cit-Patents.tar.zst 119.1 MB com-friendster 65,608,366 1,806,067,135 XL com-friendster.tar.zst 6.7 GB datagen-7_5-fb 633,432 34,185,747 S datagen-7_5-fb.tar.zst 162.3 MB datagen-7_6-fb 754,147 42,162,988 S datagen-7_6-fb.tar.zst 200.0 MB datagen-7_7-zf 13,180,508 32,791,267 S datagen-7_7-zf.tar.zst 434.5 MB datagen-7_8-zf 16,521,886 41,025,255 S datagen-7_8-zf.tar.zst 544.3 MB datagen-7_9-fb 1,387,587 85,670,523 S datagen-7_9-fb.tar.zst 401.2 MB datagen-8_0-fb 1,706,561 107,507,376 M datagen-8_0-fb.tar.zst 502.5 MB datagen-8_1-fb 2,072,117 134,267,822 M datagen-8_1-fb.tar.zst 625.4 MB datagen-8_2-zf 43,734,497 106,440,188 M datagen-8_2-zf.tar.zst 1.4 GB datagen-8_3-zf 53,525,014 130,579,909 M datagen-8_3-zf.tar.zst 1.7 GB datagen-8_4-fb 3,809,084 269,479,177 M datagen-8_4-fb.tar.zst 1.2 GB datagen-8_5-fb 4,599,739 332,026,902 L datagen-8_5-fb.tar.zst 1.5 GB datagen-8_6-fb 5,667,674 421,988,619 L datagen-8_6-fb.tar.zst 1.9 GB datagen-8_7-zf 145,050,709 340,157,363 L datagen-8_7-zf.tar.zst 4.6 GB datagen-8_8-zf 168,308,893 413,354,288 L datagen-8_8-zf.tar.zst 5.3 GB datagen-8_9-fb 10,572,901 848,681,908 L datagen-8_9-fb.tar.zst 3.7 GB datagen-9_0-fb 12,857,671 1,049,527,225 XL datagen-9_0-fb.tar.zst 4.6 GB datagen-9_1-fb 16,087,483 1,342,158,397 XL datagen-9_1-fb.tar.zst 5.8 GB datagen-9_2-zf 434,943,376 1,042,340,732 XL datagen-9_2-zf.tar.zst 13.7 GB datagen-9_3-zf 555,270,053 1,309,998,551 XL datagen-9_3-zf.tar.zst 17.4 GB datagen-9_4-fb 29,310,565 2,588,948,669 XL datagen-9_4-fb.tar.zst 14.0 GB datagen-sf3k-fb 33,484,375 2,912,009,743 XL datagen-sf3k-fb.tar.zst 12.7 GB datagen-sf10k-fb 100,218,750 9,404,822,538 2XL datagen-sf10k-fb.tar.zst 40.5 GB dota-league 61,170 50,870,313 S dota-league.tar.zst 114.3 MB graph500-22 2,396,657 64,155,735 S graph500-22.tar.zst 202.4 MB graph500-23 4,610,222 129,333,677 M graph500-23.tar.zst 410.6 MB graph500-24 8,870,942 260,379,520 M graph500-24.tar.zst 847.7 MB graph500-25 17,062,472 523,602,831 L graph500-25.tar.zst 1.7 GB graph500-26 32,804,978 1,051,922,853 XL graph500-26.tar.zst 3.4 GB graph500-27 63,081,040 2,111,642,032 XL graph500-27.tar.zst 7.1 GB graph500-28 121,242,388 4,236,163,958 2XL graph500-28.tar.zst 14.4 GB 
graph500-29 232,999,630 8,493,569,115 2XL graph500-29.tar.zst 29.6 GB graph500-30 447,797,986 17,022,117,362 3XL graph500-30.tar.zst 60.8 GB kgs 832,247 17,891,698 XS kgs.tar.zst 65.7 MB twitter_mpi 52,579,678 1,963,263,508 XL twitter_mpi.tar.zst 5.7 GB wiki-Talk 2,394,385 5,021,410 2XS wiki-Talk.tar.zst 34.9 MB example-directed 10 17 - example-directed.tar.zst 1.0 KB example-undirected 9 12 - example-undirected.tar.zst 1.0 KB test-bfs-directed \u0026lt;100 \u0026lt;100 - test-bfs-directed.tar.zst \u0026lt;2.0 KB test-bfs-undirected \u0026lt;100 \u0026lt;100 - test-bfs-undirected.tar.zst \u0026lt;2.0 KB test-cdlp-directed \u0026lt;100 \u0026lt;100 - test-cdlp-directed.tar.zst \u0026lt;2.0 KB test-cdlp-undirected \u0026lt;100 \u0026lt;100 - test-cdlp-undirected.tar.zst \u0026lt;2.0 KB test-pr-directed \u0026lt;100 \u0026lt;100 - test-pr-directed.tar.zst \u0026lt;2.0 KB test-pr-undirected \u0026lt;100 \u0026lt;100 - test-pr-undirected.tar.zst \u0026lt;2.0 KB test-lcc-directed \u0026lt;100 \u0026lt;100 - test-lcc-directed.tar.zst \u0026lt;2.0 KB test-lcc-undirected \u0026lt;100 \u0026lt;100 - test-lcc-undirected.tar.zst \u0026lt;2.0 KB test-wcc-directed \u0026lt;100 \u0026lt;100 - test-wcc-directed.tar.zst \u0026lt;2.0 KB test-wcc-undirected \u0026lt;100 \u0026lt;100 - test-wcc-undirected.tar.zst \u0026lt;2.0 KB test-sssp-directed \u0026lt;100 \u0026lt;100 - test-sssp-directed.tar.zst \u0026lt;2.0 KB test-sssp-undirected \u0026lt;100 \u0026lt;100 - test-sssp-undirected.tar.zst \u0026lt;2.0 KB ","permalink":"https://ldbcouncil.org/benchmarks/graphalytics/","tags":null,"title":"LDBC Graphalytics Benchmark (LDBC Graphalytics)"},{"categories":null,"contents":"The Semantic Publishing Benchmark (SPB) is an LDBC benchmark for testing the performance of RDF engines inspired by the Media/Publishing industry. In particular, LDBC worked with British Broadcasting Corporation BBC to define this benchmark, for which BBC donated workloads, ontologies and data. The publishing industry is an area where significant adoption of RDF is taking place.\nThere have been many academic benchmarks for RDF but none of these are truly industrial-grade. The SPB combines a set of complex queries under inference with continuous updates and special failover tests for systems implementing replication.\nSPB performance is measured by producing a workload of CRUD (Create, Read, Update, Delete) operations which are executed simultaneously. The benchmark offers a data generator that uses real reference data to produce datasets of various sizes and tests the scalability aspect of RDF systems. The benchmark workload consists of (a) editorial operations that add new data, alter or delete existing (b) aggregation operations that retrieve content according to various criteria. 
The benchmark also tests conformance for various rules inside the OWL2-RL rule-set.\nThe SPB specification contains the description of the benchmark and the data generator and all information about its software components can be found on the SPB developer page.\nSemantic Publishing Benchmark (SPB) Audited Results SF Triples RW Agents Interactive (Q/sec) Updates (ops/sec) Cost Software Hardware Test Sponsor Date FDR 3 256M 16 / 4 335.48 25.66 177,474 USD GraphDB EE 10.0.1 AWS r6id.8xlarge Ontotext AD 2023-01-29 FDR, summary 3 256M 24 / 0 413.16 0.00 207,474 USD GraphDB EE 10.0.1 AWS r6id.8xlarge Ontotext AD 2023-01-29 FDR, summary 3 256M 64 / 4 1121.76 9.53 652,422 USD GraphDB EE 10.0.1 3×AWS r6id.8xlarge Ontotext AD 2023-01-29 FDR, summary 3 256M 64 / 0 985.63 0.00 562,422 USD GraphDB EE 10.0.1 3×AWS r6id.8xlarge Ontotext AD 2023-01-29 FDR, summary 5 1B 16 / 4 105.76 10.45 177,474 USD GraphDB EE 10.0.1 AWS r6id.8xlarge Ontotext AD 2023-01-29 FDR, summary 5 1B 24 / 0 158.10 0.00 207,474 USD GraphDB EE 10.0.1 AWS r6id.8xlarge Ontotext AD 2023-01-29 FDR, summary 5 1B 64 / 4 372.56 4.04 652,422 USD GraphDB EE 10.0.1 3×AWS r6id.8xlarge Ontotext AD 2023-01-29 FDR, summary 5 1B 64 / 0 408.68 0.00 562,422 USD GraphDB EE 10.0.1 3×AWS r6id.8xlarge Ontotext AD 2023-01-29 FDR, summary 1 64M 8 / 2 100.85 10.19 37,504 EUR GraphDB EE 6.2 Intel Xeon E5-1650v3 6×3.5Ghz, 96GB RAM Ontotext AD 2015-04-26 FDR 1 64M 8 / 2 142.76 10.67 35,323 EUR GraphDB SE 6.3 alpha Intel Xeon E5-1650v3 6×3.5GHz, 64GB RAM Ontotext AD 2015-06-10 FDR 3 256M 8 / 2 29.90 9.50 37,504 EUR GraphDB EE 6.2 Intel Xeon E5-1650v3 6×3.5Ghz, 96GB RAM Ontotext AD 2015-04-26 FDR 3 256M 8 / 2 54.64 9.50 35,323 EUR GraphDB SE 6.3 alpha Intel Xeon E5-1650v3 6×3.5GHz, 64GB RAM Ontotext AD 2015-06-10 FDR 1 64M 22 / 2 149.04 156.83 20,213 USD Virtuoso v7.50.3213 Intel Xeon E5-2630 6×2.30GHz, 192 GB RAM OpenLink Software 2015-06-09 FDR 3 256M 22 / 2 80.62 92.71 20,213 USD Virtuoso v7.50.3213 Intel Xeon E5-2630 6×2.30GHz, 192 GB RAM OpenLink Software 2015-06-09 FDR 3 256M 30 / 3 115.38 109.85 24,528 USD Virtuoso v7.50.3213 AWS r3.8xlarge OpenLink Software 2015-06-09 FDR 5 1B 22 / 2 32.28 72.72 20,213 USD Virtuoso v7.50.3213 Intel Xeon E5-2630 6×2.30GHz, 192 GB RAM OpenLink Software 2015-06-09 FDR 5 1B 30 / 3 45.81 55.45 24,528 USD Virtuoso v7.50.3213 AWS r3.8xlarge OpenLink Software 2015-06-10 FDR LDBC-certified auditors SPB audits can be commissioned from the following LDBC-certified auditors:\nPjotr Scholtze ","permalink":"https://ldbcouncil.org/benchmarks/spb/","tags":null,"title":"LDBC Semantic Publishing Benchmark (LDBC-SPB)"},{"categories":null,"contents":"This file is here so that Hugo generates the page.\n","permalink":"https://ldbcouncil.org/benchmarks/snb-bi/","tags":null,"title":"LDBC SNB Business Intelligence workload"},{"categories":null,"contents":"This file is here so that Hugo generates the page.\n","permalink":"https://ldbcouncil.org/benchmarks/snb-interactive/","tags":null,"title":"LDBC SNB Interactive workload"},{"categories":null,"contents":"The Social Network Benchmark (SNB) suite defines graph workloads targeting database management systems and is maintained by the LDBC SNB Task Force.\nThe benchmark suite consists of two distinct workloads on a common dataset:\nThe Business Intelligence workload is focusing on aggregation- and join-heavy complex queries touching a large portion of the graph with microbatches of insert/delete operations. Its data sets are available in Cloudflare R2 and in the SURF/CWI repository. 
The Interactive workload captures transactional graph processing scenario with complex read queries that access the neighbourhood of a given node in the graph and update operations that continuously insert new data in the graph. Its data sets are available in the CWI/SURF data repository. For a brief overview, see our talk given at FOSDEM 2023\u0026rsquo;s graph developer room. The Social Network Benchmark\u0026rsquo;s specification can be found on arXiv.\nAudited results – SNB Business Intelligence workload – SNB Interactive workload Commissioning audits For auditing requests, please reach out at info@ldbcouncil.org. Audits can only be commissioned by LDBC member companies by contracting any of the LDBC-certified auditors. Note that there is a 2,000 GBP auditing fee to be paid for the LDBC for non-sponsor company members. Sponsor companies are exempt from this.\nFor a short summary of LDBC\u0026rsquo;s auditing process, including preparation steps, timelines, and pricing, see the Auditing process for the LDBC Social Network Benchmark document.\nUse of audited results Fair use policies The LDBC Social Network Benchmark is subject to the LDBC Fair Use Policies.\nRetrospective review of publications related to LDBC benchmark standards Review of 2019 preprint (sponsored by TigerGraph) Review of 2020 whitepaper (authored by Oracle) Review of the keynote at NODES 2021 (Neo4j Online Developer Expo and Summit) ","permalink":"https://ldbcouncil.org/benchmarks/snb/","tags":null,"title":"LDBC Social Network Benchmark (LDBC SNB)"},{"categories":null,"contents":"SNB Interactive (version 0.2.2) audited results SF Throughput Cost Software Hardware Test Sponsor Date Full Disclosure Report 10 101.20 ops/s 30,427 EUR Sparksee 5.1.1 2×Xeon 2630v3 8-core 2.4GHz, 256GB RAM Sparsity Technologies SA 2015-04-27 Full Disclosure Report 30 1,287.17 ops/s 20,212 EUR Virtuoso 07.50.3213 v7fasttrack 2×Xeon2630 6-core 2.4GHz, 192GB RAM OpenLink Software 2015-04-27 Full Disclosure Report 30 86.50 ops/s 30,427 EUR Sparksee 5.1.1 2×Xeon 2630v3 8-core 2.4GHz, 256GB RAM Sparsity Technologies SA 2015-04-27 Full Disclosure Report 100 1,200.00 ops/s 20,212 EUR Virtuoso 07.50.3213 v7fasttrack 2×Xeon2630 6-core 2.4GHz, 192GB RAM OpenLink Software 2015-04-27 Full Disclosure Report 100 81.70 ops/s 37,927 EUR Sparksee 5.1.1 2×Xeon 2630v3 8-core 2.4GHz, 256GB RAM Sparsity Technologies SA 2015-04-27 Full Disclosure Report 300 635.00 ops/s 20,212 EUR Virtuoso 07.50.3213 v7fasttrack 2×Xeon2630 6-core 2.4GHz, 192GB RAM OpenLink Software 2015-04-27 Full Disclosure Report ","permalink":"https://ldbcouncil.org/benchmarks/snb/audited-results-v0.2.2/","tags":null,"title":"LDBC Social Network Benchmark legacy audited results"},{"categories":null,"contents":"This file is here so that Hugo generates the member page.\n","permalink":"https://ldbcouncil.org/leadership/","tags":null,"title":"Leadership"},{"categories":null,"contents":"This file is here so that Hugo generates the member page.\n","permalink":"https://ldbcouncil.org/organizational-members/","tags":null,"title":"Organizational Members"},{"categories":null,"contents":"LDBC currently offers the following benchmarks:\nGraphalytics: Graph algorithms for graph analytical platforms Financial Benchmark: Benchmark for financial workloads, targeting distributed systems Semantic Publishing Benchmark: An RDF-based benchmark for semantic databases Social Network Benchmark Suite (SNB): The SNB targets database management systems with graph-processing capabilities. 
It consists of two workloads, Interactive and Business Intelligence Uses of LDBC benchmarks are subject to the Fair Use Policy for LDBC Benchmarks.\n","permalink":"https://ldbcouncil.org/benchmarks/overview/","tags":null,"title":"Overview of LDBC Benchmarks"},{"categories":null,"contents":"Group leaders: Jan Hidders (Birkbeck College, University of London), Juan Sequeda (data.world)\nThe PGSWG has 4 sub-groups: PG-Basic, PG-Constraints, PG-Properties, PG-Nulls\nPG-Basic Group leader: Jan Hidders (Birkbeck College, University of London) Focus: Basic constructs and semantics Group members Alastair Green (JCC Consulting; Birkbeck College, University of London) Angela Bonifati (Lyon 1 University) Bei Li (Google) Dominik Tomaszuk (University of Bialystok) Enrico Franconi (Free University of Bozen-Bolzano) George Fletcher (Eindhoven TU) Gilles Privat (Orange S.A.) Hannes Voigt (Neo4j) Harsh Thakkar (Consultant OSTHUS GmBH) Jan Hidders (Birkbeck College, University of London) Jason Crawford (Amazon) Josh Perryman (VeracityID) Joshua Shinavier (LinkedIn) Juan Sequeda (data.world) Keith W. Hare (JCC Consulting) Koji Annoura (UTI, Inc.) Leonid Libkin (ENS Paris, University of Edinburgh) Liat Peterfreund (ENS Paris) Michael Schmidt (Amazon Web Services) Renzo Angles (Universidad de Talca) Slawek Staworko (Université de Lille) Stefania Dumbrava (Ecole Nationale Supérieure d\u0026rsquo;Informatique pour l\u0026rsquo;Industrie et l\u0026rsquo;Entreprise (ENSIIE)) Victor Lee (TigerGraph) Victor Marsault (CNRS) Wim Martens (University of Bayreuth) Wook-Shin Han (POSTECH) PG-Constraints Group leader: George Fletcher (TU Eindhoven) Focus: Key constraints and cardinality constraints Group members Alastair Green (JCC Consulting; Birkbeck College, University of London) Andrea Cali (Birkbeck College, University of London) Angela Bonifati (Lyon 1 University) Bei Li (Google) Borislav Iordanov (Kobrix) Dominik Tomaszuk (University of Bialystok) Enrico Franconi (Free University of Bozen-Bolzano) Filip Murlak (University of Warsaw) George Fletcher (Eindhoven TU) Jan Hidders (Birkbeck College, University of London) Jason Crawford (Amazon) Josh Perryman (VeracityID) Juan Sequeda (data.world) Keith W. Hare (JCC Consulting) Koji Annoura (UTI, Inc.) Leonid Libkin (ENS Paris, University of Edinburgh) Michael Schmidt (Amazon Web Services) Slawek Staworko (Université de Lille) Stefania Dumbrava (Ecole Nationale Supérieure d\u0026rsquo;Informatique pour l\u0026rsquo;Industrie et l\u0026rsquo;Entreprise (ENSIIE)) Wim Martens (University of Bayreuth) Wook-Shin Han (POSTECH) PG-Properties Group leader: Joshua Shinavier (LinkedIn) Focus: Data types for properties Group members Alastair Green (JCC Consulting; Birkbeck College, University of London) Angela Bonifati (Lyon 1 University) Bei Li (Google) Borislav Iordanov (Kobrix) Dominik Tomaszuk (University of Bialystok) Enrico Franconi (Free University of Bozen-Bolzano) Filip Murlak (University of Warsaw) George Fletcher (Eindhoven TU) Gilles Privat (Orange S.A.) Harsh Thakkar (Consultant OSTHUS GmBH) Jan Hidders (Birkbeck College, University of London) Jason Crawford (Amazon) Josh Perryman (VeracityID) Joshua Shinavier (LinkedIn) Juan Sequeda (data.world) Keith W. Hare (JCC Consulting) Koji Annoura (UTI, Inc.) 
Michael Schmidt (Amazon Web Services) Renzo Angles (Universidad de Talca) Stefania Dumbrava (Ecole Nationale Supérieure d\u0026rsquo;Informatique pour l\u0026rsquo;Industrie et l\u0026rsquo;Entreprise (ENSIIE)) Victor Lee (TigerGraph) Victor Marsault (CNRS) Wim Martens (University of Bayreuth) Wook-Shin Han (POSTECH) PG-Nulls Group leader: Angela Bonifati (Lyon 1 University) Focus: Null values Group members Alastair Green (JCC Consulting; Birkbeck College, University of London) Angela Bonifati (Lyon 1 University) Dominik Tomaszuk (University of Bialystok) Enrico Franconi (Free University of Bozen-Bolzano) Filip Murlak (University of Warsaw) Gilles Privat (Orange S.A.) Jan Hidders (Birkbeck College, University of London) Joshua Shinavier (LinkedIn) Juan Sequeda (data.world) Koji Annoura (UTI, Inc.) Leonid Libkin (ENS Paris, University of Edinburgh) Liat Peterfreund (ENS Paris) Michael Schmidt (Amazon Web Services) Paolo Guagliardo (University of Edinburgh) Slawek Staworko (Université de Lille) Stefania Dumbrava (Ecole Nationale Supérieure d\u0026rsquo;Informatique pour l\u0026rsquo;Industrie et l\u0026rsquo;Entreprise (ENSIIE)) Victor Lee (TigerGraph) Wim Martens (University of Bayreuth) Wook-Shin Han (POSTECH) Threshold queries Angela Bonifati (Lyon 1 University) Dominik Tomaszuk (University of Bialystok) Filip Murlak (University of Warsaw) George Fletcher (Eindhoven TU) Jan Hidders (Birkbeck College, University of London) Joshua Shinavier (LinkedIn) Matthias Hofer (University of Bayreuth) Slawek Staworko (Université de Lille) Stefania Dumbrava (Ecole Nationale Supérieure d\u0026rsquo;Informatique pour l\u0026rsquo;Industrie et l\u0026rsquo;Entreprise (ENSIIE)) Wim Martens (University of Bayreuth) ","permalink":"https://ldbcouncil.org/gql-community/pgswg/","tags":null,"title":"Property Graph Schema Working Group (PGSWG)"},{"categories":null,"contents":"See our publications page.\n","permalink":"https://ldbcouncil.org/publications/","tags":null,"title":"Publications"}] \ No newline at end of file diff --git a/index.xml b/index.xml new file mode 100644 index 00000000..9776e7e4 --- /dev/null +++ b/index.xml @@ -0,0 +1,5468 @@ + + + + Linked Data Benchmark Council + https://ldbcouncil.org/ + Recent content on Linked Data Benchmark Council + Hugo -- gohugo.io + en-us + &copy; Copyright LDBC 2024 + Fri, 30 Aug 2024 09:00:00 -0800 + + Eighteenth TUC Meeting + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + Fri, 30 Aug 2024 09:00:00 -0800 + + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Shipeng Qi (AntGroup), Wenyuan Yu (Alibaba Demo), Yan Zhou (CreateLink)</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located in <strong>Guangzhou</strong> with <a href="https://vldb.org/2024/">VLDB 2024</a> on <strong>August 30-31 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. <strong>If you would like to participate please register using <a href="https://forms.gle/aVPrrcxXpSwrWPnh6">our form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="august-30-friday">August 30, Friday</h4> +<p><strong>Location:</strong> <a href="https://www.langhamhotels.com/en/the-langham/guangzhou/">Langham Place</a>, Guangzhou, <strong>room 1</strong>,<br> +co-located with VLDB (N0.630-638 Xingang Dong Road, Haizhu District, Guangzhou, China). 
See the map <a href="https://maps.app.goo.gl/86jD3Dy9Aa7bwLs36">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="august-31-saturday">August 31, Saturday</h4> +<p><strong>Location:</strong> Alibaba Center, Guangzhou (N0.88 Dingxin Road, Haizhu District, Guangzhou, China), near to VLDB Langham Place. See the map <a href="https://maps.app.goo.gl/HgEVafZMRmrzUsgW8">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + Seventeenth TUC Meeting + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + Sun, 09 Jun 2024 09:00:00 -0400 + + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + <p><strong>Organizers:</strong> Renzo Angles, Sebastián Ferrada</p> +<p>LDBC is hosting a one-day in-person workshop, co-located in <strong>Santiago de Chile</strong> with <a href="https://2024.sigmod.org/venue.shtml">SIGMOD 2024</a> on <strong>June 9 (Sunday)</strong>.</p> +<p>The workshop will be held in the <strong>Hotel Plaza El Bosque Ebro</strong> (<a href="https://www.plazaelbosque.cl">https://www.plazaelbosque.cl</a>), which is two blocks away from SIGMOD&rsquo;s venue. See the map <a href="https://maps.app.goo.gl/78oiw3zo2pH3gy5R6">here</a>.</p> +<p><strong>If you would like to participate please register using <a href="https://forms.gle/XXgaQfwBZAMMZJb78">this form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in Chile time (GMT-4).</strong></p> +<p><strong>Each speaker will have 20 minutes for exposition plus 5 minutes for questions.</strong></p> +<table> +<thead> +<tr> +<th>Time</th> +<th>Speaker</th> +<th>Title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>Welcome</td> +<td>&ldquo;Canelo&rdquo; saloon</td> +</tr> +<tr> +<td>09:30</td> +<td>Alastair Green (LDBC Vice-chair)</td> +<td>Status of the LDBC Extended GQL Schema Working Group</td> +</tr> +<tr> +<td>10:00</td> +<td>Hannes Voigt (Neo4j)</td> +<td>Inside the Standardization Machine Room: How ISO/IEC 39075:2024 – GQL was produced</td> +</tr> +<tr> +<td>10:30</td> +<td>Calin Iorgulescu (Oracle)</td> +<td>PGX.D: Distributed graph processing engine</td> +</tr> +<tr> +<td>11:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>11:30</td> +<td>Ricky Sun (Ultipa, Inc.)</td> +<td>A Unified Graph Framework with SCC (Storage-Compute Coupled) and HDC (High-Density Computing) Clustering</td> +</tr> +<tr> +<td>12:00</td> +<td>Daan de Graaf (TU Eindhoven)</td> +<td>Algorithm Support in a Graph Database, Done Right</td> +</tr> +<tr> +<td>12:30</td> +<td>Angela Bonifati (Lyon 1 University and IUF, France)</td> +<td>Transforming Property Graphs</td> +</tr> +<tr> +<td>13:00</td> +<td>Brunch</td> +<td></td> +</tr> +<tr> +<td>14:00</td> +<td>Juan Sequeda (data.world)</td> +<td>A Benchmark to Understand the Role of Knowledge Graphs on Large Language Model&rsquo;s Accuracy for Question Answering on Enterprise SQL Databases</td> +</tr> +<tr> +<td>14:30</td> +<td>Olaf Hartig (Linköping University)</td> +<td>FedShop: A Benchmark for Testing the Scalability of SPARQL Federation Engines</td> +</tr> +<tr> +<td>15:00</td> +<td>Olaf Hartig (Amazon)</td> +<td>Datatypes for Lists and Maps in RDF Literals</td> +</tr> +<tr> +<td>15:30</td> +<td>Peter Boncz (CWI and MotherDuck)</td> +<td>The state of DuckPGQ</td> +</tr> +<tr> +<td>16:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>16:30</td> +<td>Juan 
Reutter (IMFD and PUC Chile)</td>
+<td>MillenniumDB: A Persistent, Open-Source, Graph Database</td>
+</tr>
+<tr>
+<td>17:00</td>
+<td>Carlos Rojas (IMFD)</td>
+<td>WDBench: A Wikidata Graph Query Benchmark</td>
+</tr>
+<tr>
+<td>17:30</td>
+<td>Sebastián Ferrada (IMFD and Univ. de Chile)</td>
+<td>An algebra for evaluating path queries</td>
+</tr>
+<tr>
+<td>19:30</td>
+<td>Dinner</td>
+<td></td>
+</tr>
+</tbody>
+</table>
+
+
+
+
+ Record-Breaking SNB Interactive Results for GraphScope
+ https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/
+ Sun, 26 May 2024 00:00:00 +0000
+
+ https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/
+ <p>We are happy to announce new <a href="https://ldbcouncil.org/benchmarks/snb-interactive/">audited results for the SNB Interactive workload</a>, achieved by the open-source <a href="https://github.com/alibaba/GraphScope">GraphScope Flex</a> system.</p>
+<p>The current audit of the system has broken several records:</p>
+<ul>
+<li>It achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s.</li>
+<li>It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s.</li>
+<li>It is the first system to successfully complete the benchmark on scale factor 1000, achieving a throughput of 127.8k ops/s.</li>
+</ul>
+<p>The audit was commissioned by <a href="https://www.alibabacloud.com/">Alibaba Cloud</a> and was conducted by <a href="https://www.linkedin.com/in/arnau-prat-a70283bb/">Dr. Arnau Prat-Pérez</a>, one of the original authors of the SNB Interactive benchmark. The queries were implemented as C++ stored procedures and the benchmark was executed on Alibaba Cloud&rsquo;s infrastructure. The <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf">executive summary</a>, <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf">full disclosure report</a>, and <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-attachments.tar.gz">supplementary package</a> describe the benchmark&rsquo;s steps and include instructions for reproduction.</p>
+<p>LDBC would like to congratulate the GraphScope Flex team on their record-breaking results.</p>
+<div align="center"><img src="https://ldbcouncil.org/images/graphscope.svg" width="200"></div>
+
+
+
+
+ Launching open-source language tools for ISO/IEC GQL
+ https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/
+ Thu, 09 May 2024 00:00:00 +0000
+
+ https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/
+ <p>Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers and to assist in the generation of code examples and tests for the GQL language. See this <a href="https://ldbcouncil.org/pages/opengql-announce">announcement from Alastair Green, Vice-chair of LDBC</a>.</p>
+<p>These tools are the work of the <strong>LDBC GQL Implementation Working Group</strong>, headed up by Michael Burbidge. Damian Wileński and Dominik Tomaszuk have worked with Michael to create these artefacts based on his ANTLR grammar for GQL.</p>
+
+
+
+
+ Announcing the Official Release of LDBC Financial Benchmark v0.1.0
+ https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/
+ Tue, 27 Jun 2023 00:00:00 +0000
+
+ https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/
+ <p>We are delighted to announce the official release of the initial version (v0.1.0) of the <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench)</a>.</p>
+<p>The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">LDBC FinBench Task Force</a>. The benchmark currently has one workload, the <strong>Transaction Workload</strong>, which captures an OLTP scenario with complex read queries that access the neighbourhood of a given node in the graph and write queries that continuously insert or delete data in the graph.</p>
+<p>Compared to LDBC SNB, FinBench differs in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. For a brief overview, see the <a href="https://ldbcouncil.org/benchmarks/finbench/finbench-talk-16th-tuc.pdf">slides</a> presented at the 16th TUC. The <a href="https://arxiv.org/pdf/2306.15975.pdf">Financial Benchmark&rsquo;s specification</a> can be found on arXiv.</p>
+<p>The release of the initial FinBench version (v0.1.0) was approved by LDBC on June 23, 2023. This is only the beginning: the FinBench Task Force will continue to polish the benchmark.</p>
+<p>If you are interested in joining the FinBench Task Force, please reach out at info at ldbcouncil.org or qishipeng.qsp at antgroup.com.</p>
+
+
+
+
+ Sixteenth TUC Meeting
+ https://ldbcouncil.org/event/sixteenth-tuc-meeting/
+ Fri, 23 Jun 2023 09:00:00 -0800
+
+ https://ldbcouncil.org/event/sixteenth-tuc-meeting/
+ <p><strong>Organizers:</strong> Oskar van Rest, Alastair Green, Gábor Szárnyas</p>
+<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2023.sigmod.org/venue.shtml">SIGMOD 2023</a> on <strong>June 23-24 (Friday-Saturday)</strong>.</p>
+<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. 
<strong>If you would like to participate please register using <a href="https://forms.gle/T6bwVHzK9V5FaKyR9">our form</a>.</strong></p> +<p>LDBC will host a <strong>social event</strong> on Friday at the <a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a>.</p> +<p>In addition, AWS will host a <strong>Happy Hour</strong> (rooftop grill with beverages) on Saturday on the Amazon Nitro South building&rsquo;s 8th floor deck: <a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>.</p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="friday">Friday</h4> +<p><strong>Location:</strong> Hyatt Regency Bellevue on Seattle&rsquo;s Eastside, <strong>room Grand K</strong>, co-located with SIGMOD (<a href="https://www.hyatt.com/en-US/hotel/washington/hyatt-regency-bellevue-on-seattles-eastside/belle">900 Bellevue Way NE, Bellevue, WA 98004-4272</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>08:30</td> +<td>08:45</td> +<td>Oskar van Rest (Oracle)</td> +<td>LDBC – State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-ldbc-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/Frk7ITssaSY">video</a></td> +</tr> +<tr> +<td>08:50</td> +<td>09:05</td> +<td>Keith Hare (JCC / WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/keith-hare-an-update-on-the-gql-and-sql-pgq-standards-efforts.pdf">slides</a>, <a href="https://youtu.be/LQYkal_0j6E">video</a></td> +</tr> +<tr> +<td>09:10</td> +<td>09:25</td> +<td>Stefan Plantikow (Neo4j / WG3)</td> +<td>GQL - Introduction to a new query language standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/stefan-plantikow-gql-v1.pdf">slides</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Leonid Libkin (University of Edinburgh &amp; RelationalAI)</td> +<td>Formalizing GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/leonid-libkin-formalizing-gql.pdf">slides</a>, <a href="https://youtu.be/YZE1a00h1I4">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Semen Panenkov (JetBrains Research)</td> +<td>Mechanizing the GQL semantics in Coq – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/semyon-panenkov-gql-in-coq.pdf">slides</a>, <a href="https://youtu.be/5xBGohqWCzo">videos</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Oskar van Rest (Oracle)</td> +<td>SQL Property Graphs in Oracle Database and Oracle Graph Server (PGX) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-sql-property-graphs-in-oracle-database-and-oracle-graph-server-pgx.pdf">slides</a>, <a href="https://youtu.be/owM9WiQubpg">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (JCC)</td> +<td>LDBC&rsquo;s organizational changes and fair use policies – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-ldbc-corporate-restructuring-and-fair-use-policies.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>Ioana Manolescu (INRIA)</td> +<td>Integrating Connection Search in Graph Queries – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ioana-manolescu-integrating-connection-search-in-graph-queries.pdf">slides</a>, <a href="https://youtu.be/LQPnmcrkUpY">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Maciej Besta (ETH Zurich)</td> +<td>Neural Graph Databases with Graph Neural Networks – <a href="https://youtu.be/ce5qNievRNs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:10</td> +<td>Longbin Lai (Alibaba Damo Academy)</td> +<td>To Revisit Benchmarking Graph Analytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/longbin-lai-benchmark-ldbc.pdf">slides</a>, <a href="https://youtu.be/s9Vtt-6t_FI">video</a></td> +</tr> +<tr> +<td>12:15</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>The World of Graph Databases from An Industry Perspective – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/yuanyuan-tian-world-of-graph-databases.pdf">slides</a>, <a href="https://youtu.be/AZuP_b95GPM">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Alin Deutsch (UC San Diego &amp; TigerGraph)</td> +<td>TigerGraph&rsquo;s Parallel Computation Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alin-deutsch-tigergraphs-computation-model.pdf">slides</a>, <a href="https://youtu.be/vcxdieJB80Y">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Chen Zhang (CreateLink)</td> +<td>Applications of a Native Distributed Graph Database in the Financial Industry – <a href="https://youtu.be/GCCT79Sps9I">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Ricky Sun (Ultipa)</td> +<td>Design of highly scalable graph database systems – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ricky-sun-ultipa.pdf">slides</a>, <a href="https://youtu.be/Sg1F64O4vGM">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Heng Lin (Ant Group)</td> +<td>The LDBC SNB implementation in TuGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-the-ldbc-snb-implementation-in-tugraph.pdf">slides</a>, <a href="https://youtu.be/fy8AuVerwnY">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>Shipeng Qi (Ant Group)</td> +<td>FinBench: The new LDBC benchmark targeting financial scenario – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/shipeng-qi-finbench.pdf">slides</a>, <a href="https://youtu.be/0xLZadDOfZk">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>17:00</td> +<td>host: Heng Lin (Ant Group), panelists: Longbin Lai (Alibaba Damo Academy), Ricky Sun (Ultipa), Gabor Szarnyas (CWI), Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>FinBench panel – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-finbench-panel.pdf">slides</a></td> +</tr> +<tr> +<td>19:00</td> +<td>22:00</td> +<td><em>dinner</em></td> +<td><em><a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a></em></td> +</tr> +</tbody> +</table> +<h4 id="saturday">Saturday</h4> +<p><strong>Location:</strong> Amazon Nitro South building, <strong>room 03.204</strong> (<a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>09:45</td> +<td>Brad Bebee (AWS)</td> +<td>Customers don&rsquo;t want a graph database, so why are we still here? – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/brad-bebee-tuc-keynote.pdf">slides</a>, <a href="https://youtu.be/bJlkpDC--fM">video</a></td> +</tr> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Fast and Efficient Update Handling for Graph H2TAP – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/muhammad-attahir-jibril-fast-and-efficient-update-handling-for-graph-h2tap.pdf">slides</a>, <a href="https://youtu.be/e8ZAszBsXV0">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Gabor Szarnyas (CWI)</td> +<td>LDBC Social Network Benchmark and Graphalytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-social-network-benchmark-and-graphalytics.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:30</td> +<td>Atanas Kiryakov and Tomas Kovachev (Ontotext)</td> +<td>GraphDB – Benchmarking against LDBC SNB &amp; SPB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tomas-kovatchev-atanas-kiryakov-benchmarking-graphdb-with-snb-and-spb.pdf">slides</a>, <a href="https://youtu.be/U6OPpNFOWqg">video</a></td> +</tr> +<tr> +<td>11:35</td> +<td>11:50</td> +<td>Roi Lipman (Redis Labs)</td> +<td>Delta sparse matrices within RedisGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/roi-lipman-delta-matrix.pdf">slides</a>, <a href="https://youtu.be/qfKsplV4Ihk">video</a></td> +</tr> +<tr> +<td>11:55</td> +<td>12:05</td> +<td>Rathijit Sen (Microsoft)</td> +<td>Microarchitectural Analysis of Graph BI Queries on RDBMS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/rathijit-sen-microarchitectural-analysis.pdf">slides</a>, <a href="https://youtu.be/55B8CkH09js">video</a></td> +</tr> +<tr> +<td>12:10</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td><em>on your own</em></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Alastair Green (JCC)</td> +<td>LEX &ndash; LDBC Extended GQL Schema – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-lex.pdf">slides</a>, <a href="https://youtu.be/DVpeb4Ce9Uw">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Ora Lassila (AWS)</td> +<td>Why limit yourself to {RDF, LPG} when you can do {RDF, LPG}, 
too – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ora-lassila-why-limit-yourself-to-lpg-when-you-can-do-rdf-too.pdf">slides</a>, <a href="https://youtu.be/7uAInoUwdds">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Jan Hidders (Birkbeck, University of London)</td> +<td>PG-Schema: a proposal for a schema language for property graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/jan-hidders-pg-schema.pdf">slides</a>, <a href="https://youtu.be/yQNL8hBTE4M">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Max de Marzi (RageDB and RelationalAI)</td> +<td>RageDB: Building a Graph Database in Anger – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/max-de-marzi-ragedb-building-a-graph-database-in-anger.pdf">slides</a>, <a href="https://youtu.be/LBbF8aslYFE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Umit Catalyurek (AWS)</td> +<td>HPC Graph Analytics on the OneGraph Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/umit-catalyurek-onegraph-hpc.pdf">slides</a>, <a href="https://youtu.be/64tv5LA6Wr8">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>David J. Haglin (Trovares)</td> +<td>How LDBC impacts Trovares – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/david-haglin-trovares.pdf">slides</a>, <a href="">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>16:25</td> +<td>Wenyuan Yu (Alibaba Damo Academy)</td> +<td>GraphScope Flex: A Graph Computing Stack with LEGO-Like Modularity – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/wenyuan-yu-graphscope-flex.pdf">slides</a>, <a href="https://youtu.be/cRikoyDmMks">video</a></td> +</tr> +<tr> +<td>16:30</td> +<td>16:40</td> +<td>Scott McMillan (Carnegie Mellon University)</td> +<td>Graph processing using GraphBLAS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/scott-mcmillan-graph-processing-using-graphblas.pdf">slides</a>, <a href="https://youtu.be/yb4hGBhUzQQ">video</a></td> +</tr> +<tr> +<td>16:45</td> +<td>16:55</td> +<td>Tim Mattson (Intel)</td> +<td>Graphs (GraphBLAS) and storage (TileDB) as Sparse Linear algebra – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tim-mattson-graphblas-and-tiledb.pdf">slides</a></td> +</tr> +<tr> +<td>17:00</td> +<td>20:00</td> +<td><em>happy hour (rooftop grill with beverages)</em></td> +<td><em>on the Nitro South building&rsquo;s 8th floor deck</em></td> +</tr> +</tbody> +</table> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + LDBC SNB – Early 2023 updates + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + Wed, 15 Feb 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + <p>2023 has been an eventful year for us so far. 
Here is a summary of our recent activities.</p>
+<ol>
+<li>
+<p>Our paper <a href="https://ldbcouncil.org/docs/papers/ldbc-snb-bi-vldb-2022.pdf">The LDBC Social Network Benchmark: Business Intelligence Workload</a> was published in PVLDB.</p>
+</li>
+<li>
+<p>David Püroja just completed his MSc thesis on creating a design towards <a href="https://ldbcouncil.org/docs/papers/msc-thesis-david-puroja-snb-interactive-v2-2023.pdf">SNB Interactive v2</a> at CWI&rsquo;s Database Architectures group. David and I gave a deep-dive talk at the FOSDEM conference&rsquo;s graph developer room titled <a href="https://fosdem.org/2023/schedule/event/graph_ldbc/">The LDBC Social Network Benchmark</a> (<a href="https://www.youtube.com/watch?v=YNF6z6gtXY4">YouTube mirror</a>).</p>
+</li>
+<li>
+<p>I gave a lightning talk at FOSDEM&rsquo;s HPC developer room titled <a href="https://www.youtube.com/watch?v=q26DHnQFw54">The LDBC Benchmark Suite</a> (<a href="https://www.youtube.com/watch?v=q26DHnQFw54">YouTube mirror</a>).</p>
+</li>
+<li>
+<p>Our auditors have successfully benchmarked a number of systems:</p>
+<ul>
+<li>SPB with the Ontotext GraphDB system for the SF3 and SF5 data sets (auditor: Pjotr Scholtze)</li>
+<li>SNB Interactive with the Ontotext GraphDB system for the SF30 data set (auditor: David Püroja)</li>
+<li>SNB Interactive with the TuGraph system running in the Aliyun cloud for the SF30, SF100, and SF300 data sets (auditor: Márton Búr)</li>
+</ul>
+</li>
+</ol>
+<p>The results and the full disclosure reports are available under the <a href="https://ldbcouncil.org/benchmarks/spb/">SPB</a> and <a href="https://ldbcouncil.org/benchmarks/snb/">SNB benchmark pages</a>.</p>
+
+
+
+
+ LDBC SNB Datagen – The winding path to SF100K
+ https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/
+ Tue, 13 Sep 2022 00:00:00 +0000
+
+ https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/
+ <p>LDBC SNB provides a data generator, which produces synthetic datasets mimicking a social network’s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism, and usability. More than two years have elapsed since my <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">last technical update</a> on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the challenges I faced during the migration. Since then, we have reached several goals: we refactored the serializers to use Spark&rsquo;s high-level writers, which support the popular Parquet data format and enable running on spot nodes; brought back factor generation; implemented support for the novel BI benchmark; and optimized the runtime to generate SF30K on 20 i3.4xlarge machines on AWS.</p>
+<h1 id="moving-to-sparksql">Moving to SparkSQL</h1>
+<p>We planned to move parts of the code to SparkSQL, an optimized runtime framework for tabular data. We hypothesized that this would benefit us on multiple fronts: SparkSQL offers an efficient batch analytics runtime, with higher-level abstractions that are simpler to understand and work with, and we could easily add support for serializing to Parquet based on SparkSQL&rsquo;s capabilities.</p>
+<blockquote>
+<p>Spark SQL is a Spark module for structured data processing. It provides a programming abstraction called DataFrames and can also act as a distributed SQL query engine. Spark SQL includes a cost-based optimizer, columnar storage, and code generation to make queries fast.</p>
+</blockquote>
+<p>Dealing with the dataset generator proved quite tricky, because it samples from various hand-written distributions and dictionaries, and contains complex domain logic, for which SparkSQL is unsuitable. We assessed that the best we could do was to wrap entire entity generation procedures in UDFs (user-defined SQL functions). However, several of these generators return entity trees<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup>, which are spread across multiple tables by the serializer, and these would have needed to be split up. Further complicating matters, we would have also had to find a way to coordinate the inner random generators&rsquo; state between the UDFs to ensure deterministic execution. Weighing these obstacles against the limited benefit we could find in SparkSQL for this part, we ultimately decided to leave entity generation as it is. We limited the SparkSQL refactor to the following areas:</p>
+<ol>
+<li>table manipulations related to shaping the output into the supported layouts and data types as set forth in the specification;</li>
+<li>deriving the Interactive and BI datasets;</li>
+<li>and generating the factor tables, which contain analytic information, such as population per country, number of friendships between city pairs, number of messages per day, etc., used by the substitution parameter generator to ensure predictable query runtimes (a minimal sketch of such an aggregation is shown below).</li>
+</ol>
+<p>We refer to points (1) and (2) collectively as dataset transformation, and to (3) as factor generation. Initially, these had been part of the generator; extracting them as part of this refactor resulted in a cleaner, more maintainable design.</p>
+<p><img src="datagen_df_0.png" alt="Datagen stages"></p>
+<p>The diagram above shows the components on a high level. The generator outputs a dataset called IR (intermediate representation), which is immediately written to disk. Then, the IR is input to the dataset transformation and factor generation stages, which respectively generate the final dataset and the factor tables. We are aware that writing out the IR adds considerable runtime overhead and doubles the disk requirements in the worst-case scenario; however, we found that there&rsquo;s no simple way to avoid it, as the generator produces entity trees, which are incompatible with the flat, tabular, column-oriented layout of SparkSQL. On the positive side, this design enables us to reuse the generator output for multiple transformations and add new factor tables without regenerating the data.</p>
+<p>I&rsquo;ll skip describing the social network graph dataset generator (i.e. stage 1) in any more detail, apart from its serializer, as that was the only part involved in the current refactor. 
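</p>
+<p>To give a feel for the factor generation side, here is a minimal, hypothetical sketch of a factor-table aggregation written with the Spark DataFrame API. The input path, entity name, and column names below are illustrative only and do not come from the actual Datagen schema:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">import org.apache.spark.sql.SparkSession
+import org.apache.spark.sql.functions.{col, count, to_date}
+
+// Hypothetical sketch of a &#34;messages per day&#34; factor table.
+object MessagesPerDayFactor {
+  def main(args: Array[String]): Unit = {
+    val spark = SparkSession.builder
+      .appName(&#34;factor-generation-sketch&#34;)
+      .master(&#34;local[*]&#34;)
+      .getOrCreate()
+
+    // Read one entity of the intermediate representation (IR); path and layout are made up.
+    val comments = spark.read.parquet(&#34;out/graphs/parquet/raw/Comment&#34;)
+
+    // Group the messages by their creation day and count them.
+    val messagesPerDay = comments
+      .groupBy(to_date(col(&#34;creationDate&#34;)).as(&#34;day&#34;))
+      .agg(count(&#34;*&#34;).as(&#34;numMessages&#34;))
+
+    // Factor tables hold aggregate information, so a plain Parquet output is sufficient.
+    messagesPerDay.write.mode(&#34;overwrite&#34;).parquet(&#34;out/factors/parquet/raw/messageCountPerDay&#34;)
+
+    spark.stop()
+  }
+}
+</code></pre></div>
+<p>The actual factor tables are more involved than this, but they follow the same pattern: read the IR, aggregate, and write out a compact table for the substitution parameter generator to consume.</p>
+<p>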
If you are interested in more details, you may look up the <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">previous blogpost in the series</a> or the <a href="https://arxiv.org/abs/2001.02299">Interactive benchmark specification</a>.</p> +<h1 id="transformation-pipeline">Transformation pipeline</h1> +<p>The dataset transformation stage sets off where generation finished, and applies an array of pluggable transformations:</p> +<ul> +<li>explodes edges and / or attributes into separate tables,</li> +<li>subsets the snapshot part and creates insert / delete batches for the BI workload,</li> +<li>subsets the snapshot part for the Interactive workload,</li> +<li>applies formatting related options such as date time representation,</li> +<li>serializes the data to a Spark supported format (CSV, Parquet),</li> +</ul> +<p>We utilize a flexible data pipeline that operates on the graph.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span>, <span style="color:#66d9ef">M2</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">]</span> <span style="color:#a6e22e">extends</span> <span style="color:#f92672">(</span><span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">])</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">In</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> apply<span style="color:#f92672">(</span>v<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">])</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=</span> transform<span 
style="color:#f92672">(</span>v<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>The <code>Transform</code> trait encodes a pure (side effect-free) function polymorphic over graphs, so that transformation pipelines can be expressed with ordinary function composition in a type safe manner. Let&rsquo;s see some of the transformations we have.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToBiTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">BI</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> keepImplicitDeletes<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.BI</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span 
style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeEdges</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Therefore, a transformation pipeline may look like this:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>params<span style="color:#f92672">,</span> start<span style="color:#f92672">,</span> end<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span 
style="color:#66d9ef">val</span> outputGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>inputGraph<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>The <code>Graph</code> record has a <code>definition</code> field containing graph-global metadata, whereas <code>entities</code> holds the datasets keyed by their entity type. There are 3 graph <em>modes</em> currently: <code>Raw</code>, <code>Interactive</code> and <code>BI</code>. The BI dataset has different layout than the rest, as it contains incremental inserts and deletes for the entities additionally to the bulk snapshot. This is captured in the <code>Layout</code> dependent type, over which the entities are polymorphic.</p> +<p>It&rsquo;s important to understand that <code>Graph</code> holds <code>DataFrame</code>s, and these are lazily computed by Spark. So, <code>Graph</code> is merely a description of transformations used to derive the comprising datasets, which makes them subject to all the SparkSQL fanciness such as query optimization, whole stage code generation, and so on. Processing is delayed until an action (such as a disk write) forces it.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> isAttrExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> isEdgesExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> useTimestamp<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">M</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">Option</span><span style="color:#f92672">[</span><span style="color:#66d9ef">String</span><span style="color:#f92672">]]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> definition<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M</span><span style="color:#f92672">],</span> 
+</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">M</span><span style="color:#66d9ef">#</span><span style="color:#66d9ef">Layout</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">sealed</span> <span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Raw</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Interactive</span><span style="color:#f92672">(</span>bulkLoadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... 
*/</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">BI</span><span style="color:#f92672">(</span>bulkloadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">,</span> batchPeriod<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">String</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">BatchedEntity</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>You may notice that <code>Transform</code> is statically typed w.r.t. <code>Mode</code>, however other properties, like <code>isAttrExploded</code>, or <code>isEdgesExploded</code> are not captured in the type, and remain merely dynamic. This makes some nonsensical transformation pipelines (i.e. that explodes edges twice in a row) syntactically valid. This trade-off in compile-time safety was made to prevent overcomplicating the types.</p> +<p>As we already mentioned, <code>Graph</code> is essentially a persistent container of <code>EntityType -&gt; DataFrame</code> mappings. <code>EntityType</code> can be <code>Node</code>, <code>Edge</code> and <code>Attr</code>, and is used to identify the entity and embellish with static metadata, such a descriptive name and primary key, whether it is static or dynamic (as per the specification), and in case of edges, the source and destination type and cardinality. This makes it very simple to create transformation rules on static entity properties with pattern matching.</p> +<p>Usually, a graph transformation involves matching entities based on their <code>EntityType</code>, and modifying the mapping (and if required, other metadata). 
Take, for example, the <code>ExplodeAttrs</code> transformation, which explodes into separate tables the values of two columns of <code>Person</code> stored as arrays:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">if</span> <span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#75715e">// assert at runtime that the transformation hasn&#39;t been applied yet +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#66d9ef">throw</span> <span style="color:#66d9ef">new</span> <span style="color:#a6e22e">AssertionError</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Attributes already exploded in the input graph&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> explodedAttr<span style="color:#f92672">(</span>attr<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Attr</span><span style="color:#f92672">,</span> node<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">DataFrame</span><span style="color:#f92672">,</span> column<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Column</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">=</span> +</span></span><span style="display:flex;"><span> attr <span style="color:#f92672">-&gt;</span> node<span style="color:#f92672">.</span>select<span style="color:#f92672">(</span>withRawColumns<span style="color:#f92672">(</span>attr<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>parent<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">),</span> explode<span style="color:#f92672">(</span>split<span style="color:#f92672">(</span>column<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;;&#34;</span><span 
style="color:#f92672">)).</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>attribute<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">)))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> modifiedEntities <span style="color:#66d9ef">=</span> input<span style="color:#f92672">.</span>entities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>collect <span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k <span style="color:#66d9ef">@</span> <span style="color:#a6e22e">Node</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person&#34;</span><span style="color:#f92672">,</span> <span style="color:#66d9ef">false</span><span style="color:#f92672">),</span> df<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#75715e">// match the Person node. This is the only one ExplodeAttrs should modify +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#a6e22e">Map</span><span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Email&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;EmailAddress&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonEmailEmailAddress&#34; entity derived by exploding the email column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Speaks&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;Language&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonSpeaksLanguage&#34; entity derived by exploding the language column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> k <span style="color:#f92672">-&gt;</span> df<span style="color:#f92672">.</span>drop<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">)</span> <span style="color:#75715e">// drop the exploded columns from person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> 
updatedEntities <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>entities<span style="color:#f92672">)(</span><span style="color:#66d9ef">_</span> <span style="color:#f92672">++</span> <span style="color:#66d9ef">_</span><span style="color:#f92672">)</span> <span style="color:#75715e">// merge-replace the modified entities in the graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> updatedEntityDefinitions <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#f92672">(</span>e<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> e <span style="color:#f92672">++</span> v<span style="color:#f92672">.</span>map<span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> k <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Some</span><span style="color:#f92672">(</span>v<span style="color:#f92672">.</span>schema<span style="color:#f92672">.</span>toDDL<span style="color:#f92672">)</span> <span style="color:#f92672">}</span> <span style="color:#75715e">// update the entity definition schema to reflect the modifications +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> l <span style="color:#66d9ef">=</span> lens<span style="color:#f92672">[</span><span style="color:#66d9ef">In</span><span style="color:#f92672">]</span> <span style="color:#75715e">// lenses provide a terse syntax for modifying nested fields +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">(</span>l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>entities<span style="color:#f92672">).</span>set<span style="color:#f92672">(</span>input<span style="color:#f92672">)((</span><span style="color:#66d9ef">true</span><span style="color:#f92672">,</span> updatedEntityDefinitions<span style="color:#f92672">,</span> updatedEntities<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Note that <code>EntityType</code> does not hold the dataset&rsquo;s full SQL schema currently, as it&rsquo;s not useful for pattern matching, but can be accessed 
directly from <code>DataFrame</code> if needed.</p> +<h1 id="inputoutput">Input/output</h1> +<p>The <code>Reader</code> and <code>Writer</code> typeclasses are used to read from a <code>Source</code> and write to a <code>Sink</code> respectively, terminating a graph transformation pipeline<br> +on both ends.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">T</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> read<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> exists<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">S</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Data</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> write<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Data</span><span style="color:#f92672">,</span> sink<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">S</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Unit</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>There are implementations under <code>ldbc.datagen.io.instances</code> that read a graph from a <code>GraphSource</code> and write to a <code>GraphSink</code>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span 
style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> source <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSource</span>, <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>read<span style="color:#f92672">(</span>source<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span><span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>graph<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// write +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> sink <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSink</span>, <span 
style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>write<span style="color:#f92672">(</span>transformedGraph<span style="color:#f92672">,</span> sink<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>We provide <a href="https://github.com/typelevel/simulacrum">Ops syntax</a> to make it shorter:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Reader.ops._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Writer.ops._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">).</span>read +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> <span style="color:#f92672">???</span> <span style="color:#75715e">/* ... 
*/</span>
+</span></span><span style="display:flex;"><span>
+</span></span><span style="display:flex;"><span><span style="color:#75715e">// write
+</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span>
+</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span>
+</span></span><span style="display:flex;"><span>transformedGraph<span style="color:#f92672">.</span>write<span style="color:#f92672">(</span><span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">))</span>
+</span></span></code></pre></div><p>The reader/writer architecture is layered: the graph reader/writer uses DataFrame readers/writers for each of its entities. One interesting aspect of implementing the reader was dealing with the input schema. Parquet is self-describing; however, as we also support the CSV format, we had to provide a way for correct schema detection and column parsing.</p>
+<p>Spark has a facility to derive SparkSQL schema from case classes automatically<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup>. We created case classes for each entity in the <code>Raw</code> dataset. We also created a typeclass <code>EntityTraits</code> associating these classes with their <code>EntityType</code>, so we can summon them (and consequently their SparkSQL schema) in the reader.</p>
+<p>The case classes are used during the serialization of the generated dataset too, but more about that later.</p>
+<h1 id="factor-generation">Factor generation</h1>
+<p>As we already mentioned, factor generation was originally part of the data generator, i.e. factor tables were calculated on the fly and emitted as side outputs. This design had some problems. Auxiliary data structures had to be maintained and interleaved with generation, which violated separation of concerns, consequently hurting readability and maintainability. Also, anything more complicated than entity-local aggregates was impossible to express in the original MapReduce framework. To keep the preceding Spark rewrite at a manageable scope, the original factor generation code had been removed.</p>
+<p>We decided it&rsquo;s best to reintroduce factor generation as a post-processing step that operates on the generated data. This makes it possible to express more complex analytical queries, requires no prior knowledge about the generator, can be done in SparkSQL (making it much simpler), and removes the impact on the generator&rsquo;s performance, so that we can optimize them separately. Since this refactor, we have almost tripled the number of factor tables (up to 31, covering both SNB workloads, BI and Interactive). The queries computing certain factor tables even use <a href="https://spark.apache.org/graphx/">GraphX</a>, which was unimaginable with the previous design.</p>
+<p>Factor tables are added by extending a map with a <code>name -&gt; Factor</code> pair. 
<code>Factor</code> declares is input entities, and accepts a function that receives input <code>DataFrames</code>, and returns a single <code>DataFrame</code> as output.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> factors <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Map</span> <span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;personDisjointEmployerPairs&#34;</span> <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Factor</span><span style="color:#f92672">(</span><span style="color:#a6e22e">PersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonKnowsPersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">OrganisationType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonWorkAtCompanyType</span><span style="color:#f92672">)</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">case</span> <span style="color:#a6e22e">Seq</span><span style="color:#f92672">(</span>person<span style="color:#f92672">,</span> personKnowsPerson<span style="color:#f92672">,</span> organisation<span style="color:#f92672">,</span> workAt<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> knows <span style="color:#66d9ef">=</span> undirectedKnows<span style="color:#f92672">(</span>personKnowsPerson<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> company <span style="color:#66d9ef">=</span> organisation<span style="color:#f92672">.</span>where<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;Type&#34;</span> <span style="color:#f92672">===</span> <span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">).</span>cache<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> personSample <span style="color:#66d9ef">=</span> person +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>orderBy<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>limit<span style="color:#f92672">(</span><span style="color:#ae81ff">20</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> personSample +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person2&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>knows<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;knows&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;knows.person2Id&#34;</span> <span style="color:#f92672">===</span> $<span 
style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>workAt<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;workAt&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;workAt.PersonId&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;knows.Person1id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>company<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;Company.id&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;workAt.CompanyId&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>select<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2id&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.name&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyName&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyId&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.creationDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2creationDate&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.deletionDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2deletionDate&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>distinct<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">},</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* more factors */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span></code></pre></div><p>As you can see, it&rsquo;s not much complicated than using plain SQL, with the added benefit of being able to extract recurring subqueries to functions (e.g. <code>undirectedKnows</code>). Currently, there&rsquo;s no parallelization between different factor tables (although each of them is parallelized internally by Spark). 
<p>The Factor table writer uses the same componentized architecture as the graph writer, i.e. it uses the DataFrame writer under the hood.</p>
+<h1 id="revamping-the-data-generators-serializer">Revamping the data generator&rsquo;s serializer</h1>
+<p>At this point, both the transformation pipeline and the factor generator were ready; however, the data generator was still chugging along with the old serializer, emitting the IR in CSV. We wanted to move this to Parquet to improve performance and reduce its size, but there was a problem: due to the generator&rsquo;s custom data representation, SparkSQL (and its DataSource API) was off-limits. So we bit the bullet and rewrote the existing serializer to emit Parquet.</p>
+<blockquote>
+<p><a href="https://parquet.apache.org/">Parquet</a> is an open source data format that evolved to be the de facto standard for Big Data batch pipelines. It offers a column-oriented, compressed, schemaful representation that is space-efficient and suited for analytic queries. The file format leverages a record shredding and assembly model, which originated at Google. This results in a file that is optimized for query performance and minimizing I/O.</p>
+</blockquote>
+<p>The new serialization framework is heavily influenced by the design of Java <code>OutputStreams</code>, in the sense that stateful objects are composed to form a pipeline. For example, in the case of <em>activities</em>, the input is an activity tree, and the output is a set of rows in multiple files (e.g. forum, forumHasTag, post, postHasTag, etc.). The components that take part in activity serialization are shown in the diagram below. The activity tree is iterated (1st component) and the corresponding entity serializer is called (2nd component), which is fed into a component that splits the records (3rd one) among several output streams writing individual files (last).</p>
+<p><img src="activity.png" alt="Activity serialization pipeline"></p>
+<p>The benefit of this architecture is that only the last component needs to change when we add support for a new output format.</p>
+<p>To support Parquet, we made use of row-level serializers available in Hadoop&rsquo;s Parquet library (bundled with SparkSQL), and internal classes in SparkSQL to derive Parquet schema for our entities. Remember how we used case classes for the <code>Raw</code> entities to derive the input schema in the graph reader during dataset transformation? Here we use the same classes (e.g. <code>Forum</code>) and Spark&rsquo;s <code>Encoder</code> framework to encode the entities in Parquet, which means that the generated output remains consistent with the <code>DataFrame</code>-based reader, and we avoid a lot of code duplication.</p>
+<h1 id="optimizations">Optimizations</h1>
+<p>After these refactors, we were able to generate the BI dataset with scale factor 10K on 300 i3.4xlarge machines in one hour. Decreasing the number of machines resulted in out of memory errors in the generator. We realized that partition sizes (and thus the number of partitions) should be determined based on the available memory. Our experiments showed that a machine with 128GB of memory is capable of generating SF3K (scale factor 3000) reliably with 3 blocks<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> per partition given ample disk size to allow for spills (tested with 3.8TB); while fewer partitions (and consequently a larger block/partition ratio) would introduce OOM errors.</p>
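+<p>The sizing rule we converged on can be captured in a small helper. The sketch below assumes the block size of 10,000 persons described in footnote 3; the <code>--partitions</code> values in the job submissions below were calculated this way from the person count of the given scale factor:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">// Sketch: cap every partition at `blocksPerPartition` blocks of `blockSize` persons.
+def numPartitions(numPersons: Long, blockSize: Long = 10000L, blocksPerPartition: Int = 3): Int =
+  math.ceil(numPersons.toDouble / blockSize / blocksPerPartition).toInt
+</code></pre></div>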
+<p>Furthermore, we split the data generator output after a certain number of rows written, to guard against the skew between different kinds of entities causing problems during transformation<sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup>. These optimizations enabled us to run SF10K reliably on 4 i3.4xlarge machines in 11 hours (which is still a more than 6x reduction in cost). We weren&rsquo;t able to run SF30K on 10 machines (1 machine / SF3K); even 15 ran out of disk. This non-linear disk use should be investigated further as it complicates calculating cluster sizes for larger scale factors.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf3k_bi <span style="color:#ae81ff">3000</span> parquet bi <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">330</span> <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs
+</span></span></code></pre></div><div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf10k_bi <span style="color:#ae81ff">10000</span> parquet bi <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">1000</span> <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\
+</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs
+</span></span></code></pre></div><p>The above examples show working configurations for generating the SF3K and SF10K BI datasets. The <code>--sf-per-executor</code> option controls the number of worker nodes allocated, in this case one node for every 3000 SF, i.e. 1 and 4 nodes respectively. 
The <code>--partitions</code> option controls the total number of partitions, and was calculated based on the number of persons using the formula <code>partitions = ceil(number_of_persons / block_size / 3)</code> to get a maximum of 3 blocks per partition.</p>
+<h1 id="conclusion">Conclusion</h1>
+<p>These improvements made LDBC SNB Datagen more modular, maintainable and efficient, costing under a cent per scale factor to generate the BI dataset, which enables us to generate datasets beyond SF 100K.</p>
+<h1 id="footnotes">Footnotes</h1>
+<div class="footnotes" role="doc-endnotes">
+<hr>
+<ol>
+<li id="fn:1">
+<p>The generator produces hierarchies, such as a forum wall with a random number of posts that have comments, etc. This tree is iterated, and different entities are written to separate files.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:2">
+<p>Shameless plug: You can learn more about this in <a href="https://www.dataversity.net/case-study-deriving-spark-encoders-and-schemas-using-implicits/">another blogpost of mine</a>.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:3">
+<p>The data generator produces blocks of 10,000 persons and their related entities. Entities from different blocks are unrelated (isolated).&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:4">
+<p>The maximum row count per file is currently 10M; however, this can be modified with a command line option. We also had an alternative design in mind where this number would have been determined based on the average row size of each entity; however, we stayed with the first version for simplicity.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+</ol>
+</div>
+
+
+
+
+ Fifteenth TUC Meeting
+ https://ldbcouncil.org/event/fifteenth-tuc-meeting/
+ Fri, 17 Jun 2022 09:20:00 -0500
+
+ https://ldbcouncil.org/event/fifteenth-tuc-meeting/
+ <p><strong>Organizers:</strong> Gábor Szárnyas, Jack Waudby, Peter Boncz, Alastair Green</p>
+<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2022.sigmod.org/venue.shtml">SIGMOD 2022</a> on <strong>June 17-18 (Friday-Saturday)</strong>.</p>
+<p>The program consists of 10-15 minute talks followed by a Q&amp;A session. The talks will be recorded and made available online.<br>
+The tentative program is the following. 
<strong>All times are in EDT.</strong></p> +<p>We will have a social event on Friday at 17:30 at <a href="https://elvezrestaurant.com/">El Vez</a> (<a href="https://g.page/ElVezPhilly">Google Maps</a>).</p> +<h4 id="friday-pennsylvania-convention-centerhttpswwwpaconventioncom-room-204bhttps2022sigmodorgprogramshtml">Friday (<a href="https://www.paconvention.com/">Pennsylvania Convention Center</a>, <a href="https://2022.sigmod.org/program.shtml">room 204B</a>)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:20</td> +<td>09:30</td> +<td>Peter Boncz (LDBC/CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/39BoOIGk9Is">video</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Alastair Green (LDBC/Birkbeck)</td> +<td>LDBC&rsquo;s fair use policies – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-fair-use-of-the-ldbc-trademark.pdf">slides</a>, <a href="https://youtu.be/7zmCysN4Rpg">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Gábor Szárnyas (LDBC/CWI), Jack Waudby (Newcastle University)</td> +<td>LDBC Social Network Benchmark: Business Intelligence workload v1.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/gabor-szarnyas-the-ldbc-social-network-benchmark-business-intelligence-workload.pdf">slides</a>, <a href="https://youtu.be/AJ96M8_njxE">video</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Heng Lin (Ant Group)</td> +<td>LDBC Financial Benchmark introduction – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/heng-lin-ldbc-financial-benchmark-introduction.pdf">slides</a>, <a href="https://youtu.be/iBhud_YjafY">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Chen Zhang (CreateLink)</td> +<td>New LDBC SNB benchmark record by Galaxybase: More than 6 times faster and 70% higher throughput – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/chen-zhang-new-ldbc-snb-benchmark-record-by-galaxybase-more-than-6-times-faster-and-70-percent-higher-throughput.pdf">slides</a>, <a href="https://youtu.be/sMzTsb8iw_Y">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>James Clarkson (Neo4j)</td> +<td>LDBC benchmarks: Promoting good science and industrial consumption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/james-clarkson-ldbc-benchmarks-promoting-good-science-and-industrial-consumption.pdf">slides</a>, <a href="https://youtu.be/VYG1mzcl9qQ">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Oskar van Rest (Oracle)</td> +<td>Creating and querying property graphs in Oracle, on-premise and in the cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oskar-van-rest-creating-and-querying-property-graphs-in-oracle-on-premise-and-in-the-cloud.pdf">slides</a>, <a href="https://youtu.be/2HX2Vixf2gs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:15</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>Conquering LDBC SNB BI at SF-10k – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/mingxi-wu-conquering-ldbc-snb-bi-at-sf10k.pdf">slides</a>, <a href="https://youtu.be/oJbqzQ_t3G8">video</a></td> +</tr> +<tr> +<td>12:20</td> +<td>13:20</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:20</td> +<td>13:35</td> +<td>Altan Birler (Technische Universität München)</td> +<td>Relational databases can handle graphs too! Experiences with optimizing the Umbra RDBMS for LDBC SNB BI – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/altan-birler-relational-databases-can-handle-graphs-too.pdf">slides</a>, <a href="https://youtu.be/cRgbdY3I2i4">video</a></td> +</tr> +<tr> +<td>13:40</td> +<td>13:55</td> +<td>David Püroja (CWI)</td> +<td>LDBC Social Network Benchmark: Interactive workload v2.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/david-puroja-ldbc-snb-interactive-workload-v2.0.pdf">slides</a></td> +</tr> +<tr> +<td>14:00</td> +<td>14:15</td> +<td>Angela Bonifati (Lyon 1 University)</td> +<td>The quest for schemas in graph databases – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/angela-bonifati-the-quest-for-schemas-in-graph-databases.pdf">slides</a>, <a href="https://youtu.be/VT7cx3Jp7V8">video</a></td> +</tr> +<tr> +<td>14:20</td> +<td>14:35</td> +<td>Matteo Lissandrini (Aalborg University)</td> +<td>Understanding graph data representations in triplestores – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/matteo-lissandrini-understanding-graph-data-representations-in-triplestores.pdf">slides</a>, <a href="https://youtu.be/xqVMJZfh_JU">video</a></td> +</tr> +<tr> +<td>14:40</td> +<td>14:55</td> +<td>Wim Martens (University of Bayreuth)</td> +<td>Path representations – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/wim-martens-path-representations.pdf">slides</a>, <a href="https://youtu.be/Ma-E5dwgf-E">video</a></td> +</tr> +<tr> +<td>15:00</td> +<td>15:20</td> +<td>Audrey Cheng (UC Berkeley)</td> +<td>TAOBench: An end-to-end benchmark for social network workloads – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/audrey-cheng-taobench.pdf">slides</a>, <a href="https://youtu.be/1p8AStxS3es">video</a></td> +</tr> +</tbody> +</table> +<h4 id="saturday-philadelphia-marriott-downtownhttpswwwmarriottcomen-ushotelsphldt-philadelphia-marriott-downtown-room-401-402-4th-floor">Saturday (<a href="https://www.marriott.com/en-us/hotels/phldt-philadelphia-marriott-downtown/">Philadelphia Marriott Downtown</a>, room 401-402, 4th floor)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Keith Hare (WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/keith-hare-property-graph-standards-process-and-timing.pdf">slides</a>, <a href="https://youtu.be/xFVD3LWnKlc">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>10:35</td> +<td>Leonid Libkin (ENS Paris)</td> +<td>Pattern matching in GQL and SQL/PGQ – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/leonid-libkin-pattern-matching-in-gql-and-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/OvGsa0qLANE">video</a></td> +</tr> +<tr> +<td>10:40</td> +<td>10:55</td> +<td>Petra Selmer (Neo4j/WG3)</td> +<td>An overview of GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/petra-selmer-towards-gql-v1-a-property-graph-query-language-standard.pdf">slides</a>, <a href="https://youtu.be/tncf2FgyIyo">video</a></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (LDBC/WG3)</td> +<td>GQL 2.0: A technical manifesto – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-gql-2.0-a-technical-manifesto.pdf">slides</a>, <a href="https://youtu.be/upIvpYy8C2g">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>George Fletcher (TU Eindhoven)</td> +<td>PG-Keys (LDBC Property Graph Schema Working Group) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/george-fletcher-pg-keys-keys-for-property-graphs.pdf">slides</a>, <a href="https://youtu.be/_W8-jOtcObc">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Arvind Shyamsundar (Microsoft)</td> +<td>Graph capabilities in Microsoft SQL Server and Azure SQL Database – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/arvind-shyamsundar-graph-capabilities-in-microsoft-sql-server-and-azure-database.pdf">slides</a>, <a href="https://youtu.be/xxV2BfZupGw">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>13:30</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Daniël ten Wolde (CWI)</td> +<td>Implementing SQL/PGQ in DuckDB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/daniel-ten-wolde-implementing-sql-pgq-in-duckdb.pdf">slides</a>, <a href="https://youtu.be/JmSfU0BTH5w">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Oszkár Semeráth, Kristóf Marussy (TU Budapest)</td> +<td>Generation techniques for consistent, realistic, diverse, and scalable graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oszkar-semerath-generation-techniques-for-consistent-realistic-diverse-and-scalable-graphs.pdf">slides</a>, <a href="https://youtu.be/hB6j6mvh-vA">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Molham Aref (RelationalAI)</td> +<td>Graph Normal Form – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/molham-aref-graph-normal-form.pdf">slides</a>, <a href="https://youtu.be/-kP4Raqr5KA">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Naomi Arnold (Queen Mary University of London)</td> +<td>Temporal graph analysis of the far-right social network Gab – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/naomi-arnold-temporal-graph-analysis-of-the-far-right-social-network-gab.pdf">slides</a>, <a href="https://youtu.be/ugSkFlif4PE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:05</td> +<td>Domagoj Vrgoč (PUC Chile)</td> +<td>Evaluating path queries in MillenniumDB – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/domagoj-vrgoc-regular-path-queries-in-millenniumdb.pdf">slides</a>, <a href="https://youtu.be/_OzJ6vI7GNU">video</a></td> +</tr> +<tr> +<td>15:10</td> +<td>15:25</td> +<td>Pavel Klinov, Evren Sirin (Stardog)</td> +<td>Stardog&rsquo;s experience with LDBC – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/evren-sirin-stardog-experience-with-ldbc.pdf">slides</a>, <a href="https://youtu.be/CBrEeOTqGKM">video</a></td> +</tr> +</tbody> +</table> + + + + + Announcing the LDBC Financial Benchmark Task Force + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + Thu, 26 May 2022 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + <p>We are delighted to announce the set up of the <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench) task force</a>.</p> +<p>The Financial Benchmark (FinBench) project aims to define a graph database evaluating benchmark and develop a data generation process and a query driver to make the evaluation of the graph database representative, reliable and comparable, especially in financial scenarios, such as anti-fraud and risk control. The FinBench is scheduled to be released in the end of 2022.</p> +<p>Compared to LDBC SNB, the FinBench will differ in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. FinBench is going to redesign the data pattern and workloads, including the data generation, the query driver, and also some other facilities referred to LDBC SNB.</p> +<p>The FinBench Task Force was approved by LDBC on May 16, 2022. The FinBench Task Force is led by Ant Group, and the initial members also include Pometry, Create Link, StarGraph, Ultipa, Katana, Intel, Memgraph (observer) and Koji Annoura (individual member). See the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">Work Charter for FinBench</a></p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or guozhihui.gzh at antgroup.com.</p> + + + + + Fourteenth TUC Meeting + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + Mon, 16 Aug 2021 16:00:00 +0200 + + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + <p>LDBC was hosting a one-day hybrid workshop, co-located with <a href="https://vldb.org/2021/">VLDB 2021</a> on <strong>August 16 (Monday) between 16:00–20:00 CEST</strong>.</p> +<p>The physical part of the workshop was held in room Akvariet 2 of the <a href="https://www.tivolihotel.com/">Tivoli Hotel</a> (Copenhagen), while the virtual part was hosted on Zoom. Our programme consisted of talks that provide an overview of LDBC&rsquo;s recent efforts. Moreover, we have invited industry practitioners and academic researchers to present their latest results.</p> +<p>Talks were scheduled to be 10 minutes with a short Q&amp;A session. We had three sessions. 
Their schedules are shown below.</p> +<h4 id="16001725-cest-ldbc-updates-benchmarks-query-languages">[16:00–17:25 CEST] LDBC updates, benchmarks, query languages</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>16:00</td> +<td>Peter Boncz (CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a></td> +</tr> +<tr> +<td>16:05</td> +<td>Gábor Szárnyas (CWI)</td> +<td>Overview of LDBC benchmarks – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-benchmarks.pdf">slides</a></td> +</tr> +<tr> +<td>16:12</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>LDBC Social Network Benchmark results with TigerGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mingxi-wu-tigergraph-snb-preliminary-results.pdf">slides</a></td> +</tr> +<tr> +<td>16:24</td> +<td>Xiaowei Zhu (Ant Group)</td> +<td>Financial Benchmark proposal – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/xiaowei-zhu-financial-benchmark.pdf">slides</a></td> +</tr> +<tr> +<td>16:36</td> +<td>Petra Selmer (Neo4j)</td> +<td>Status report from the Existing Languages Working Group (ELWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/petra-selmer-elwg.pdf">slides</a>, <a href="https://youtu.be/I5A8VuFDhsA">video</a></td> +</tr> +<tr> +<td>16:48</td> +<td>Jan Hidders (Birkbeck)</td> +<td>Status report from the Property Graph Schema Working Group (PGSWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/jan-hidders-pgswg.pdf">slides</a>, <a href="https://youtu.be/iEbVi9T-HVk">video</a></td> +</tr> +<tr> +<td>17:00</td> +<td>Keith Hare (JCC Consulting)</td> +<td>Database Language Standards Structure and Process, SQL/PGQ – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/keith-hare-database-language-standards-structure-and-process-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/ZgFCuzods4g">video</a></td> +</tr> +<tr> +<td>17:12</td> +<td>Stefan Plantikow (GQL Editor)</td> +<td>Report on the GQL standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/stefan-plantikow-gql.pdf">slides</a>, <a href="https://youtu.be/z0pN5NwKsgc">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="17351845-cest-systems-and-data-structures">[17:35–18:45 CEST] Systems and data structures</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>17:35</td> +<td>Vasileios Trigonakis (Oracle Labs)</td> +<td>PGX.D aDFS: An Almost Depth-First-Search Distributed Graph-Querying System – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasileios-trigonakis-pgxd-adfs.pdf">slides</a>, <a href="https://youtu.be/cv2ZfWRBOek">video</a></td> +</tr> +<tr> +<td>17:47</td> +<td>Matthias Hauck (SAP)</td> +<td>JSON, Spatial, Graph – Multi-model Workloads with SAP HANA Cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/matthias-hauck-json-spatial-graph-sap-hana-cloud.pdf">slides</a>, <a 
href="https://youtu.be/dgpMJFho6Q8">video</a></td> +</tr> +<tr> +<td>17:59</td> +<td>Nikolay Yakovets (Eindhoven University of Technology)</td> +<td>AvantGraph – <a href="https://youtu.be/z0pN5NwKsgcttachments/nikolay-yakovets-avantgraph.pdf">slides</a>, <a href="https://youtu.be/9M9FOycovTw">video</a></td> +</tr> +<tr> +<td>18:11</td> +<td>Semih Salihoglu (University of Waterloo)</td> +<td>GRainDB: Making RDBMSs Efficient on Graph Workloads Through Predefined Joins – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semih-salihoglu-graindb.pdf">slides</a>, <a href="https://youtu.be/FFK3y6vPHJs">video</a></td> +</tr> +<tr> +<td>18:23</td> +<td>Semyon Grigorev (Saint Petersburg University)</td> +<td>Context-free path querying: Obstacles on the way to adoption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semyon-grigorev-cfpq.pdf">slides</a>, <a href="https://youtu.be/pha1xIpEL3I">video</a></td> +</tr> +<tr> +<td>18:35</td> +<td>Per Fuchs (Technical University of Munich)</td> +<td>Sortledton: A universal, transactional graph data structure – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/per-fuchs-sortledton.pdf">slides</a>, <a href="https://youtu.be/33ZjsNN0hhU">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="1855-2000-cest-high-level-approaches-and-benchmarks">[18:55-20:00 CEST] High-level approaches and benchmarks</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>18:55</td> +<td>Angelos-Christos Anadiotis (Ecole Polytechnique and Institut Polytechnique de Paris)</td> +<td>Empowering Investigative Journalism with Graph-based Heterogeneous Data Management – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/angelos-christos-anadiotis-investigative-journalism-graph-data-management.pdf">slides</a>, <a href="https://youtu.be/a1VYjyec8dg">video</a></td> +</tr> +<tr> +<td>19:07</td> +<td>Vasia Kalavri (Boston University)</td> +<td>Learning to partition unbounded graph streams – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasia-kalavri-learning-to-partition-unbounded-graph-streams.pdf">slides</a>, <a href="https://youtu.be/PTlUABKWniA">video</a></td> +</tr> +<tr> +<td>19:19</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Towards a Hybrid OLTP-OLAP Graph Benchmark – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/muhammad-attahir-jibril-hybrid-oltp-olap-benchmark.pdf">slides</a>, <a href="https://youtu.be/tMBVszTSJXc">video</a></td> +</tr> +<tr> +<td>19:31</td> +<td>Riccardo Tommasini (University of Tartu)</td> +<td>An outlook on Benchmarks for Graph Stream Processing – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/riccardo-tommasini-graph-stream-processing-benchmarks.pdf">slides</a>, <a href="https://youtu.be/HabvJvPXsLc">video</a></td> +</tr> +<tr> +<td>19:43</td> +<td>Mohamed Ragab (University of Tartu)</td> +<td>Benchranking: Towards prescriptive analysis of big graph processing: the case of SparkSQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mohamed-ragab-benchranking.pdf">slides</a>, <a href="https://youtu.be/mZ8LhGUq7Wg">video</a></td> 
+</tr>
+</tbody>
+</table>
+
+
+
+
+ Thirteenth TUC Meeting
+ https://ldbcouncil.org/event/thirteenth-tuc-meeting/
+ Tue, 30 Jun 2020 14:00:00 +0000
+
+ https://ldbcouncil.org/event/thirteenth-tuc-meeting/
+ <p>LDBC is pleased to announce its Thirteenth Technical User Community (TUC) meeting.</p>
+<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p>
+<p>This TUC meeting will be a two-day event hosted online. We welcome all users of RDF and Graph technologies to attend. If you are interested in attending the event, please contact Gabor Szarnyas (BME) to register.</p>
+<h3 id="snb-task-force">SNB Task Force</h3>
+<ul>
+<li>Progress report
+<ul>
+<li>ACID compliance test suite</li>
+<li>Integrating deletions to Datagen</li>
+<li>Migrating Datagen to Spark</li>
+<li>Redesign of BI read queries</li>
+<li>Extensions to the driver</li>
+</ul>
+</li>
+<li>Ongoing work
+<ul>
+<li>Datagen: tuning the distribution of deletes</li>
+<li>Interactive 2.0 workload</li>
+<li>BI 1.0 workload</li>
+</ul>
+</li>
+</ul>
+<p>Zoom links will be sent through email.</p>
+
+
+
+
+ Speeding Up LDBC SNB Datagen
+ https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/
+ Fri, 12 Jun 2020 00:00:00 +0000
+
+ https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/
+ <p>LDBC&rsquo;s <a href="#references">Social Network Benchmark [4]</a> (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework where different graph-based technologies can be fairly tested and compared, that can drive the identification of systems&rsquo; bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data management.</p>
+<p>LDBC SNB provides <a href="https://github.com/ldbc/ldbc_snb_datagen">Datagen</a> (Data Generator), which produces synthetic datasets, mimicking a social network&rsquo;s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism and usability. To address scalability in particular, Datagen has been implemented on the MapReduce computation model to enable scaling out across a distributed cluster. However, since its inception in the early 2010s there has been a tremendous amount of development in the big data landscape, both in the sophistication of distributed processing platforms and in public cloud IaaS offerings. In the light of this, we should reevaluate this implementation, and in particular, investigate whether Apache Spark would be a more cost-effective solution for generating datasets on the scale of tens of terabytes, on public clouds such as Amazon Web Services (AWS).</p>
+<h2 id="overview">Overview</h2>
+<p>The benchmark&rsquo;s specification describes a social network <a href="https://github.com/ldbc/ldbc_snb_docs/blob/9253abbde94ec7eaccd366c5d4c15cca30752e36/figures/schema-comfortable.pdf">data model</a> which divides its components into two broad categories: static and dynamic. The dynamic element consists of an evolving network where people make friends, post in forums, comment or like each other&rsquo;s posts, etc. 
In contrast, the static component contains related attributes such as countries, universities and organizations and are fixed values. For the detailed specifications of the benchmark and the Datagen component, see <a href="#references">References</a>.</p> +<p>Datasets are generated in a multi-stage process captured as a sequence of MapReduce steps (shown in the diagram below).</p> +<p><img src="datagen_flow.png" alt=""> \ <em>Figure 1. LDBC SNB Datagen Process on Hadoop</em></p> +<p>In the initialization phase dictionaries are populated and distributions are initialized. In the first generation phase persons are synthesized, then relationships are wired between them along 3 dimensions (university, interest and random). After merging the graph of person relationships, the resulting dataset is output. Following this, activities such as forum posts, comments, likes and photos are generated and output. Finally, the static components are output.</p> +<p><em>Note: The diagram shows the call sequence as implemented. All steps are sequential &ndash; including the relationship generation &ndash;, even in cases when the data dependencies would allow for parallelization.</em></p> +<p>Entities are generated by procedural Java code and are represented as POJOs in memory and as sequence files on disk. Most entities follow a shallow representation, i.e foreign keys (in relational terms) are mapped to integer ids, which makes serialization straightforward.<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup> A notable exception is the Knows edge which contains only the target vertex, and is used as a navigation property on the source Person. The target Person is replaced with only the foreign key augmented with some additional information in order to keep the structure free of cycles. Needless to say, this <em>edge as property</em> representation makes the data harder to handle in SQL than it would be with a flat join table.</p> +<p>Entity generation amounts to roughly one fifth of the main codebase. It generates properties drawn from several random distributions using mutable pRNGs. Determinism is achieved by initializing the pRNGs to seeds that are fully defined by the configuration with constants, and otherwise having no external state in the logic.<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup></p> +<p>Serialization is done by hand-written serializers for the supported output formats (e.g. CSV) and comprises just a bit less than one third of the main codebase. Most of the output is created by directly interacting with low-level HDFS file streams. Ideally, this code should be migrated to higher-level writers that handle faults and give consistent results when the task has to be restarted.</p> +<h2 id="motivations-for-the-migration">Motivations for the migration</h2> +<p>The application is written using Hadoop MapReduce, which is now largely superseded by more modern distributed batch processing platforms, notably Apache Spark. For this reason, it was proposed to migrate Datagen to Spark. The migration provides the following benefits:</p> +<ul> +<li> +<p><strong>Better memory utilization:</strong> MapReduce is disk-oriented, i.e. it writes the output to disk after each reduce stage which is then read by the next MapReduce job. As public clouds provide virtual machines with sufficient RAM to encapsulate any generated dataset, time and money are wasted by the overhead this unnecessary disk I/O incurs. 
Instead, the intermediate results should be cached in memory where possible. The lack of support for this is a well-known limitation of MapReduce.</p> +</li> +<li> +<p><strong>Smaller codebase:</strong> The Hadoop MapReduce library is fairly ceremonial and boilerplatey. Spark provides a higher-level abstraction that is simpler to work with, while still providing enough control on the lower-level details required for this workload.</p> +</li> +<li> +<p><strong>Small entry cost:</strong> Spark and MapReduce are very close conceptually, they both utilise HDFS under the hood, and run on the JVM. This means that a large chunk of the existing code can be reused, and migration to Spark can, therefore, be completed with relatively small effort. Additionally, MapReduce and Spark jobs can be run on AWS EMR using basically the same HW/SW configuration, which facilitates straightforward performance comparisons.</p> +</li> +<li> +<p><strong>Incremental improvements:</strong> Spark exposes multiple APIs for different workloads and operating on different levels of abstraction. Datagen may initially utilise the lower-level, Java-oriented RDDs (which offer the clearest 1 to 1 mapping when coming from MapReduce) and gradually move towards DataFrames to support Parquet output in the serializers and maybe unlock some SQL optimization capabilities in the generators later down the road.</p> +</li> +<li> +<p><strong>OSS, commodity:</strong> Spark is one of the most widely used open-source big data platforms. Every major public cloud provides a managed offering for Spark. Together these mean that the migration increases the approachability and portability of the code.</p> +</li> +</ul> +<h2 id="first-steps">First steps</h2> +<p>The first milestone is a successful run of LDBC Datagen on Spark while making the minimum necessary amount of code alterations. This entails the migration of the Hadoop wrappers around the generators and serializers. The following bullet-points summarize the key notions that cropped up during the process.</p> +<ul> +<li> +<p><strong>Use your memory:</strong> A strong focus was placed on keeping the call sequence intact, so that the migrated code evaluates the same steps in the same order, but with data passed as RDDs. It was hypothesised that the required data could be either cached in memory entirely at all times, or if not, regenerating them would still be faster than involving the disk I/O loop (e.g. by using <code>MEMORY_AND_DISK</code>). In short, the default caching strategy was used everywhere.</p> +</li> +<li> +<p><strong>Regression tests:</strong> Lacking tests apart from an id uniqueness check, meant there were no means to detect bugs introduced by the migration. Designing and implementing a comprehensive test suite was out of scope, so instead, regression testing was utilised, with the MapReduce output as the baseline. The original output mostly consists of Hadoop sequence files which can be read into Spark, allowing comparisons to be drawn with the output from the RDD produced by the migrated code.</p> +</li> +<li> +<p><strong>Thread-safety concerns:</strong> Soon after migrating the first generator and running the regression tests, there were clear discrepancies in the output. These only surfaced when the parallelization level was set greater than 1. This indicated the presence of potential race conditions. 
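+</p>
+<p>As a concrete illustration of this class of bug and of the shape of the fix (a minimal sketch, not the actual Datagen serializer code):</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala">import java.time.LocalDate
+import java.time.format.DateTimeFormatter
+
+// Unsafe: java.text.SimpleDateFormat keeps mutable state, so a single instance
+// shared by tasks running as parallel threads in one JVM can produce garbage.
+// val format = new java.text.SimpleDateFormat(&#34;yyyy-MM-dd&#34;)
+
+// Safe: DateTimeFormatter is immutable and therefore thread-safe to share.
+val format = DateTimeFormatter.ofPattern(&#34;yyyy-MM-dd&#34;)
+def serializeDate(date: LocalDate): String = format.format(date)
+</code></pre></div>
+<p>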
<h2 id="case-study-person-ranking">Case study: Person ranking</h2>
+<p>The migration was mostly straightforward; however, the so-called person ranking step required some thought. The goal of this step is to organize persons so that similar ones appear close to each other in a deterministic order. This provides a scalable way to cluster persons according to a similarity metric, as introduced in the <a href="#references">S3G2 paper [3]</a>.</p>
+<h3 id="the-original-mapreduce-version">The original MapReduce version</h3>
+<p><img src="person_ranking.svg" alt=""> <br> <em>Figure 2. Diagram of the MapReduce code for ranking persons</em></p>
+<p>The implementation, shown in pseudocode above, works as follows:</p>
+<ol>
+<li>Each person is mapped to an equivalence key and fed into <code>TotalOrderPartitioner</code>, which maintains an order-sensitive partitioning while trying to emit groups of roughly equal size to keep the data skew low.</li>
+<li>Each reducer keys its partition with its own task id and a counter variable, initialized to zero and incremented for each person, establishing a local ranking inside the group. The final state of the counter (which is the total number of persons in that group) is saved to a separate &ldquo;side-channel&rdquo; file upon the completion of the reduce task.</li>
+<li>In a subsequent reduce-only stage, the global order is established by reading all of these previously emitted count files in the order of their partition number in each reducer, and creating an ordered map from each partition number to the cumulative count of persons in all preceding partitions. This is done in the setup phase. In the reduce function, the respective count is incremented and assigned to each person.</li>
+</ol>
+<p>Once this ranking is done, the whole range is sliced up into equally sized blocks, which are processed independently. For example, when wiring relationships between persons, only those appearing in the same block are considered.</p>
+<h3 id="the-migrated-version">The migrated version</h3>
+<p>Spark provides a <code>sortBy</code> function which takes care of the first step above in a single line. The remaining problem is collecting the partition sizes and making them available in a later step. While the MapReduce version uses a side output, in Spark the partition sizes are collected in a separate job and passed into the next phase using a broadcast variable. The resulting code size is a fraction of the original; a simplified sketch of the approach is shown below.</p>
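+<p>The following Scala sketch illustrates the idea. It is not the actual Datagen code: the <code>Person</code> case class and its <code>equivalenceKey</code> are simplified, hypothetical stand-ins, and error handling is omitted.</p>
+<pre><code class="language-scala">// Simplified sketch (not the actual Datagen code) of person ranking on Spark.
+import org.apache.spark.SparkContext
+import org.apache.spark.rdd.RDD
+
+// Hypothetical, simplified stand-in for Datagen's Person entity.
+case class Person(id: Long, university: String, mainInterest: String) {
+  def equivalenceKey: String = s"$university|$mainInterest"
+}
+
+object PersonRanker {
+  def rank(sc: SparkContext, persons: RDD[Person], numPartitions: Int): RDD[(Long, Person)] = {
+    // Step 1: sortBy replaces the TotalOrderPartitioner-based ordering.
+    val sorted = persons.sortBy(_.equivalenceKey, true, numPartitions)
+
+    // Step 2: count each partition in a separate job
+    // (the MapReduce version used side-channel files for this).
+    val partitionSizes = sorted
+      .mapPartitionsWithIndex((idx, it) => Iterator((idx, it.size.toLong)))
+      .collect()
+
+    // Turn the per-partition counts into cumulative offsets and broadcast them.
+    val offsets = new Array[Long](numPartitions)
+    var running = 0L
+    partitionSizes.sortBy(_._1).foreach { p =>
+      offsets(p._1) = running
+      running += p._2
+    }
+    val bOffsets = sc.broadcast(offsets)
+
+    // Step 3: global rank = broadcast offset of the partition + local index.
+    sorted.mapPartitionsWithIndex { (idx, it) =>
+      it.zipWithIndex.map { case (person, local) => (bOffsets.value(idx) + local, person) }
+    }
+  }
+}
+</code></pre>
+<p>In practice, <code>sorted</code> would be cached (in line with the &ldquo;use your memory&rdquo; point above), so that the second pass does not recompute the sort.</p>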
<h2 id="benchmarks">Benchmarks</h2>
+<p>Benchmarks were carried out on AWS <a href="https://aws.amazon.com/emr/">EMR</a>, originally utilising <a href="https://aws.amazon.com/ec2/instance-types/i3/">i3.xlarge</a> instances because of their fast NVMe SSD storage and ample RAM.</p>
+<p>The application parameter <code>hadoop.numThreads</code> controls the number of reduce threads in each Hadoop job for the MapReduce version, and the number of partitions in the serialization jobs for the Spark one. For MapReduce, this was set to <code>n_nodes</code>, i.e. the number of machines; experimentation yielded slowdowns for higher values. The Spark version, on the other hand, performed better with this parameter set to <code>n_nodes * v_cpu</code>. The scale factor (SF) parameter determines the output size. It is defined so that one SF unit generates around 1 GB of data; that is, SF10 generates around 10 GB, SF30 around 30 GB, etc. It should be noted, however, that the output was only around 60% of this in these experiments, for two reasons. First, update stream serialization was not migrated to Spark, due to problems in the original implementation. Of course, for the purpose of a faithful comparison, the corresponding code was removed from the MapReduce version as well before executing the benchmarks. This explains a 10% reduction from the expected size; the rest can be attributed to incorrectly tuned parameters.<sup id="fnref:5"><a href="#fn:5" class="footnote-ref" role="doc-noteref">5</a></sup> The MapReduce results were as follows (the last column normalizes the runtime by multiplying it with the number of workers and dividing by the scale factor, e.g. 40 * 3 / 100 = 1.20 for SF100):</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * worker/SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10</td>
+<td>1</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>16</td>
+<td>1.60</td>
+</tr>
+<tr>
+<td>30</td>
+<td>1</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>34</td>
+<td>1.13</td>
+</tr>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>40</td>
+<td>1.20</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>44</td>
+<td>1.32</td>
+</tr>
+</tbody>
+</table>
+<p>It can be observed that the runtime per scale factor increases only slowly, which is good. The metric charts show an underutilized, bursty CPU. The bursts are presumably interrupted by disk I/O when the node is writing out the results of a completed job. It can also be seen that memory only starts to get consumed after 10 minutes of the run have passed.</p>
+<p><img src="mr_sf100_cpu_load.png" alt=""> <br>
+<em>Figure 3. CPU load for the MapReduce cluster is bursty and less than<br>
+50% on average (SF100, 2nd graph shows master)</em></p>
+<p><img src="mr_sf100_mem_free.png" alt=""> <br>
+<em>Figure 4. 
The job only starts to consume memory when already 10 minutes<br>
+into the run (SF100, 2nd graph shows master)</em></p>
+<p>Let&rsquo;s see how Spark fares.</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * worker/SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10</td>
+<td>1</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>10</td>
+<td>1.00</td>
+</tr>
+<tr>
+<td>30</td>
+<td>1</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>21</td>
+<td>0.70</td>
+</tr>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>27</td>
+<td>0.81</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>36</td>
+<td>1.08</td>
+</tr>
+<tr>
+<td>1000</td>
+<td>30</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>47</td>
+<td>1.41</td>
+</tr>
+<tr>
+<td>3000</td>
+<td>90</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>47</td>
+<td>1.41</td>
+</tr>
+</tbody>
+</table>
+<p>A similar trend can be seen here; however, the runtimes are around 70% of those of the MapReduce version. The larger scale factors (SF1000 and SF3000) yielded a longer runtime than expected. On the metric charts for SF100, the CPU shows full utilization, except at the end, when the results are serialized in one go and the CPU is basically idle (unfortunately, the snapshot of the diagram doesn&rsquo;t include this part). Spark can be seen to use up all the memory quite fast, even for SF100. For SF1000 and SF3000, the nodes run so low on memory that some of the RDDs most probably have to be recalculated multiple times (no disk-level serialization was used here), which seems to be the most plausible explanation for the slowdowns experienced. In fact, the OOM errors encountered when running SF3000 support this hypothesis further. It was thus proposed to scale up the RAM in the instances. The CPU utilization also hints that adding some extra vCPUs could yield a further speedup.</p>
+<p><img src="spark_sf100_cpu_load.png" alt=""> <br>
+<em>Figure 5. Full CPU utilization for Spark (SF100, last graph shows<br>
+master)</em></p>
+<p><img src="spark_sf100_mem_free.png" alt=""> <br>
+<em>Figure 6. Spark eats up memory fast (SF100, 2nd graph shows master)</em></p>
+<p>i3.2xlarge would have been the most straightforward option for scaling up the instances; however, its humongous 1.9 TB disk is completely unnecessary for this job. 
Instead, the cheaper r5d.2xlarge instance type was used, which is largely identical to i3.2xlarge except that it <em>only</em> has a 300 GB SSD.</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * worker/SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>16</td>
+<td>0.48</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>21</td>
+<td>0.63</td>
+</tr>
+<tr>
+<td>1000</td>
+<td>30</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>26</td>
+<td>0.78</td>
+</tr>
+<tr>
+<td>3000</td>
+<td>90</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>25</td>
+<td>0.75</td>
+</tr>
+<tr>
+<td>10000</td>
+<td>303</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>25</td>
+<td>0.75</td>
+</tr>
+</tbody>
+</table>
+<p>The last column clearly demonstrates our ability to keep the cost per scale factor unit constant.</p>
+<h2 id="next-steps">Next steps</h2>
+<p>The next improvement is refactoring the serializers so that they use Spark&rsquo;s high-level writer facilities. The most compelling benefit is that this will make the jobs fault-tolerant, as Spark maintains the integrity of the output files in case the task that writes them fails. This makes Datagen more resilient and opens up the possibility of running on less reliable hardware configurations (e.g. EC2 spot instances on AWS) for additional cost savings. The new serializers will likely also yield some speedup on the same cluster configuration. A sketch of what such a serializer could look like is given at the end of this section.</p>
+<p>As already mentioned, the migration of the update stream serialization was skipped due to problems with the original code. Ideally, it should be reimplemented on top of the new serializers.</p>
+<p>The Spark migration also serves as an important building block for the next generation of LDBC benchmarks. As part of extending the SNB benchmark suite, the SNB task force has recently extended Datagen with support for <a href="#references">generating delete operations [1]</a>. The next step for the task force is to fine-tune the temporal distributions of these deletion operations to ensure that the emerging sequence of events is realistic, i.e. that the emerging distribution resembles what a database system would experience when serving a real social network.</p>
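+<p>For illustration, here is a rough Scala sketch (not the actual implementation) of what a serializer built on Spark&rsquo;s high-level writer facilities could look like, assuming the entities have already been converted to a DataFrame. The names and options used are illustrative only.</p>
+<pre><code class="language-scala">// Sketch only (not the actual Datagen serializers): writing one entity type
+// through Spark's DataFrame writer, which handles task retries and output commit.
+import org.apache.spark.sql.DataFrame
+
+object EntityWriter {
+  def writeEntity(entity: DataFrame, outputDir: String, name: String): Unit = {
+    entity.write
+      .option("header", "true")
+      .option("sep", "|")        // assuming pipe-separated CSV output
+      .csv(s"$outputDir/$name")
+
+    // The same DataFrame could be written as Parquet instead:
+    // entity.write.parquet(s"$outputDir/$name-parquet")
+  }
+}
+</code></pre>
+<p>Because the writer participates in Spark&rsquo;s output commit protocol, a failed or restarted write task should not leave partial files in the final output directory, which is exactly the fault-tolerance property discussed above.</p>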
<h2 id="acknowledgements">Acknowledgements</h2>
+<p>This work builds upon the work of Arnau Prat, Gábor Szárnyas, Ben Steer, Jack Waudby and other LDBC contributors. Thanks for your help and feedback!</p>
+<h2 id="references">References</h2>
+<p>[1] <a href="https://ldbcouncil.org/docs/papers/datagen-deletes-grades-nda-2020.pdf">Supporting Dynamic Graphs and Temporal Entity Deletions in the LDBC Social Network Benchmark&rsquo;s Data Generator</a></p>
+<p>[2] <a href="https://www.youtube.com/watch?v=ZQOLuCOOpSI">9th TUC Meeting &ndash; LDBC SNB Datagen Update &ndash; Arnau Prat (UPC)</a> - <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">slides</a></p>
+<p>[3] <a href="https://research.vu.nl/en/publications/s3g2-a-scalable-structure-correlated-social-graph-generator">S3G2: a Scalable Structure-correlated Social Graph Generator</a></p>
+<p>[4] <a href="https://arxiv.org/abs/2001.02299">The LDBC Social Network Benchmark</a></p>
+<p>[5] <a href="https://ldbcouncil.org/">LDBC</a> - <a href="https://github.com/ldbc">LDBC GitHub organization</a></p>
+<div class="footnotes" role="doc-endnotes">
+<hr>
+<ol>
+<li id="fn:1">
+<p>This also makes it easier to map the data to a tabular format, making it a SQL-friendly representation.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:2">
+<p>It&rsquo;s hard to imagine this done declaratively in SQL.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:3">
+<p>Instead, multiple YARN containers have to be used if you want to parallelize on the same machine.&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:4">
+<p>Although editors usually render these using different font styles.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+<li id="fn:5">
+<p>With the addition of deletes, entities often get inserted and deleted during the simulation (which is normal in a social network). During serialization, we check for such entities and omit them. However, we forgot to account for this when determining the output size, which we will amend when tuning the distributions.&#160;<a href="#fnref:5" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p>
+</li>
+</ol>
+</div>
+ + + + + Twelfth TUC Meeting + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + Fri, 05 Jul 2019 08:30:00 +0100 + + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + <p>LDBC is pleased to announce its Twelfth Technical User Community (TUC) meeting.</p>
+<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) give feedback on these, (3) hear about user experiences with graph data management technologies, and (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p>
+<p>This TUC meeting will be a one-day event on the last Friday of <strong><a href="https://sigmod2019.org/">SIGMOD/PODS 2019</a></strong> in Amsterdam, The Netherlands, in the conference venue of <strong><a href="http://sigmod2019.org/conf_venue">Beurs van Berlage</a></strong>. The room is the Mendes da Silva kamer. 
Please check its tips for <strong><a href="http://sigmod2019.org/accommodation">accommodation in Amsterdam</a></strong>.</p> +<p>Note also that at SIGMOD/PODS in Amsterdam on Sunday, June 30, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2019">GRADES-NDA 2019</a>, that may be of interest to our audience (this generally holds for the whole SIGMOD/PODS program, of course).</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>You need to be registered in order to get into the SIGMOD/PODS venue. Friday, July 5, is the final, workshop, day of SIGMOD/PODS, and the LDBC TUC meeting joins the other workshops for coffee and lunch.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management.</p> +<p><strong>Talk proposals can be sent to Peter Boncz</strong>, who is also the local organizer. <strong>Please also send your slides to this email for archiving on this site.</strong></p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting, there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The morning slot (08:30-10:30) is reserved for an LDBC Board Meeting, to which in principle only LDBC directors are invited (that meeting will be held in the same room).</p> +<p>The TUC meeting will start on Friday morning after the morning coffee break of SIGMOD/PODS 2019 (<strong>room: Mendes da Silva kamer</strong>):</p> +<p>08:30-10:30 LDBC Board Meeting (non-public)</p> +<p>10:30-11:00 Coffee</p> +<p>11:00-12:45 Session 1: Graph Benchmarks</p> +<ul> +<li> +<p>11:00-11:05 Welcome &amp; introduction</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230404.pdf">11:05-11:45 Gabor Szarnyas (BME), Benjamin Steer (QMUL), Jack Waudby (Newcastle University): Business Intelligence workload: Progress report and roadmap</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706117.pdf">11:45-12:00 Frank McSherry (Materialize): Experiences implementing LDBC queries in a dataflow system</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706118.pdf">12:00-12:25 Vasileios Trigonakis (Oracle): Evaluating a new distributed graph query engine with LDBC: Experiences and limitations</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706130.pdf">12:25-12:45 Ahmed Musaafir (VU Amsterdam): LDBC Graphalytics</a></p> +</li> +</ul> +<p>12:45-14:00 Lunch</p> +<p>14:00-16:05 Session 2: Graph Query Languages</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706120.pdf">14:00-14:25 Juan Sequeda (Capsenta): Property Graph Schema Working Group: A progress report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706121.pdf">14:25-14:50 Stefan Plantikow (Neo4j): GQL: Scope and features</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706122.pdf">report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706119.pdf">14:50-15:15 Vasileios Trigonakis (Oracle): Property graph extensions for the SQL standard</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706129.pdf">15:15-15:40 Alin Deutsch (TigerGraph): Modern graph analytics support in GSQL, TigerGraph&rsquo;s query language</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230401.pdf">15:40-16:05 Jan Posiadała (Nodes and Edges, Poland): Executable semantics of graph query language</a></p> +</li> +</ul> +<p>16:05-16:30 Coffee</p> 
+<p>16:30-17:50 Session 3: Graph System Performance</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111968258.pdf">16:30-16:50 Per Fuchs (CWI): Fast, scalable WCOJ graph-pattern matching on in-memory graphs in Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706124.pdf">16:50-17:10 Semih Salihoglu (University of Waterloo): Optimizing subgraph queries with a mix of tradition and modernity</a> <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706116.pptx">pptx</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706128.pdf">17:10-17:30 Roi Lipman (RedisGraph): Evaluating Cypher queries and procedures as algebraic operations within RedisGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706133.pdf">17:30-17:50 Alexandru Uta (VU Amsterdam): Low-latency Spark queries on updatable data</a></p> +</li> +</ul> +<p>If there is interest, we will organize a social dinner on Friday evening for LDBC attendees.</p> + + + + + Eleventh TUC Meeting + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + Fri, 08 Jun 2018 08:30:00 -0500 + + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + <p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmark development, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event preceding the <a href="https://sigmod2018.org/">SIGMOD/PODS 2018</a> conference in Houston, Texas (not too far away, the whole next week). Note also that at SIGMOD/PODS in Houston on Sunday 10, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2018/">GRADES-NDA 2018</a> as well, so you might combine travel.</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz (<a href="mailto:boncz@cwi.nl">boncz@cwi.nl</a>) and Larri (<a href="mailto:larri@ac.upc.ed">larri@ac.upc.edu</a>). 
Local organizer is Juan Sequeda (<a href="mailto:juanfederico@gmail.com">juanfederico@gmail.com</a>).</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its interactive, business analytics and graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00:</p> +<ul> +<li> +<p>10:30-10:35 Peter Boncz (CWI) - introduction to the LDBC TUC meeting</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090478.pdf">10:35-11:00 Juan Sequeda (Capsenta) - Announcing: gra.fo</a></p> +</li> +<li> +<p>11:00-11:30 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090466.pdf">11:30-11:55 Gabor Szarnyas (BME) - LDBC benchmarks: three aspects of graph processing</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090463.pdf">11:55-12:20 Peter Boncz (CWI) - G-CORE: a composable graph query language by LDBC</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090472.pdf">12:20-12:45 Yinglong Xia (Huawei) - Graph Engine for Cloud AI</a></p> +</li> +<li> +<p>12:45-14:00 lunch</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090474.pdf">14:00-14:25 Stefan Plantikow (Neo4j) - Composable Graph Queries and Multiple Named Graphs in Cypher for Apache Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090481.pdf">14:25-14:50 Oskar van Rest (Oracle) - Analyzing Stack Exchange data using Property Graph in Oracle</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090485.pdf">14:50-15:15 Brad Bebee (Amazon) - Neptune: the AWS graph management service</a></p> +</li> +<li> +<p>15:15-15:40 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99811329.pdf">15:40-16:05 Bryon Jacob (data.world): Broadening the Semantic Web</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99287041.pdf">16:05-16:30 Jason Plurad (IBM) - Graph Computing with JanusGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99745793.pdf">16:30-16:55 Arthur Keen (Cambridge Semantics): AnzoGraph</a></p> +</li> +<li> +<p><a href="http://relational.ai/">16:55-17:20 Molham Aref (relational.ai)</a>) - Introducing.. 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99418113.pdf">relational.ai</a></p> +</li> +<li> +<p>18:00 - 20:00 social dinner in Austin (sponsored by Intel Corp.), Coopers BBQ, 217 Congress Ave, Austin, TX 78701</p> +</li> +</ul> +<h3 id="location">Location</h3> +<p>The TUC will be held at the <a href="https://www.cs.utexas.edu/">University of Texas at Austin, Department of Computer Science</a> in the <a href="https://www.google.com/maps/place/The+University+of+Texas:+Department+of+Computer+Science/@30.2860955,-97.737582,18z/data=!4m5!3m4!1s0x0:0x12edecc8226b3241!8m2!3d30.2862279!4d-97.7365348">Gates Dell Complex (GDC): 2317 Speedway, Austin TX, 78712</a> Room: GDC 6.302</p> +<p>The GDC building has a North and a South building. GDC 6.302 is in the North building. When you enter the main entrance, the North building is on the left and it is served by a pair of elevators. You can take or the elevator to the 6th floor. Exit the elevator on the 6th floor. Turn left, right, left.</p> +<h3 id="from-austin-to-sigmodpods-houston-on-saturday-june-9">From Austin to SIGMOD/PODS (Houston) on Saturday June 9</h3> +<p>Many of the attendees will be going to SIGMOD/PODS which will be held in Houston.</p> +<h4 id="bus">Bus</h4> +<p>One option is to take a <a href="https://us.megabus.com/journey-planner/journeys?days=1&amp;concessionCount=0&amp;departureDate=2018-06-09&amp;destinationId=318&amp;inboundOtherDisabilityCount=0&amp;inboundPcaCount=0&amp;inboundWheelchairSeated=0&amp;nusCount=0&amp;originId=320&amp;otherDisabilityCount=0&amp;pcaCount=0&amp;totalPassengers=1&amp;wheelchairSeated=0">MegaBus that departs from downtown Austin and arrives at downtown Houston</a>.</p> +<p>There is a bus that departs at 12:00PM and arrives at 3:00pm. Cost is $20 (as of April 23).</p> +<p>If you want to spend the day in Austin, there is a bus that departs at 9:55PM and arrives at 12:50am. Cost is $5 (as of April 23).</p> + + + + + Tenth TUC Meeting + https://ldbcouncil.org/event/tenth-tuc-meeting/ + Fri, 01 Sep 2017 10:30:00 +0100 + + https://ldbcouncil.org/event/tenth-tuc-meeting/ + <p>This will be a one-day event at the <a href="http://www.vldb.org/2017">VLDB 2017</a> conference in Munich, Germany on September 1, 2017.</p> +<p>Topics and activities of interest in these TUC meetings are:</p> +<ul> +<li>Presentation on graph data management usage scenarios.</li> +<li>Presentation of the benchmarking results for the different benchmarks, as well as the graph query language task force.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Adrian Diaz (UPC) at <a href="mailto:adiaz@ac.upc.edu">adiaz@ac.upc.edu</a> to register; registration is free, but required.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. 
Talk proposals are handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00</p> +<p>10:30-12:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87588865.pdf">Peter Boncz (CWI): GraphQL task force update - the G-CORE proposal</a> (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868018.pptx">pptx</a>)</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868008.pdf">Gabor Szarnyas (Budapest University of Technology and Economics Hungarian Academy of Sciences): Updates on the Social Network Benchmark BI Workload</a></li> +<li>Alexandru Iosup, Wing Lung Ngai (VU/TU Delft): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868014.pdf">LDBC Graphalytics v0.9</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868013.pdf">Graphalytics Global Competition and Graphalytics Custom Benchmark</a></li> +</ul> +<p>12:00-13:30: lunch break</p> +<p>13:30-15:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868024.pdf">Arnau Prat (UPC): Datasynth: Democratizing property graph generation</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868026.pdf">Marcus Paradies (SAP): SAP HANA GraphScript</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031809.pdf">Yinglong Xia (Huawei): The EYWA Graph Engine in a Cloud AI Platform</a></li> +<li>Gaétan Hains (Huawei): Cost semantics for graph queries</li> +</ul> +<p>15:00-15:30: break</p> +<p>15:30-17:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031812.pdf">Petra Selmer and Stefan Plantikow (Neo4j): openCypher Developments in 2017</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87195650.pdf">Markus Kaindl (Springer): SN SciGraph &ndash; Building a Linked Data Knowledge Graph for the Scholarly Publishing Domain</a></li> +<li>Irini Fundulaki (FORTH): The HOBBIT Link Discovery and Versioning Benchmarks</li> +<li>Ghislain Atemezing (Mondeca): Benchmarking Enterprise RDF stores with Publications Office Dataset</li> +</ul> +<p>Speakers should aim for a <strong>20-minute talk</strong>.</p> +<p>Further:</p> +<ul> +<li>on Friday 
evening (19:00-21:00) there will be a <strong>social dinner</strong> at <a href="https://www.loewenbraeukeller.com/en/pub-and-beer-garden/">Löwenbräukeller</a>, sponsored and arranged by LDBC member Huawei (who have their European Research Center in Munich).</li> +<li>on Friday morning (8:30-10:30) there will be a meeting of the LDBC board of directors, but this meeting is not public.</li> +</ul> +<h3 id="venue">Venue</h3> +<p>The Technical University of Munich (TUM) is hosting that week the <a href="http://www.vldb.org/2017">VLDB conference</a>; on the day of the TUC meeting the main conference will have finished, but there will be a number of co-located workshops ongoing, and the TUC participants will blend in with that crowd for the breaks and lunch.</p> +<p>The TUC meeting will be held in in <strong>Room 2607</strong> alongside the VLDB workshops that day (MATES, ADMS, DMAH, DBPL and BOSS).</p> +<p><strong>address: Technische Universität München (TUM), Arcisstraße 21, 80333 München</strong></p> +<p><a href="https://www.google.nl/maps/place/Technische+Universit%C3%A4t+M%C3%BCnchen/@48.14966,11.5656715,17z/data=!3m1!4b1!4m5!3m4!1s0x479e7261336d8c11:0x79a04d44dc5bf19d!8m2!3d48.14966!4d11.5678602?hl=en">Google Maps</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920002.jpg" alt=""><br> +<img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920003.jpg" alt=""></p> + + + + + Ninth TUC Meeting + https://ldbcouncil.org/event/ninth-tuc-meeting/ + Thu, 09 Feb 2017 15:07:18 -0400 + + https://ldbcouncil.org/event/ninth-tuc-meeting/ + <p>LDBC is pleased to announce its Ninth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> in Walldorf, Germany on February 9+10, 2017.</p> +<p>This will be the third TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>;</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Inalytics and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Thursday morning, with a program from 09:00-18:00, interrupted by a lunch break.</p> +<p>Thursday evening (19:00-21:00) there will be a <strong>social dinner</strong> in Heidelberg.</p> +<p>Friday morning the event resumes from 9:00-12:00. In the afternoon, there is a (closed) LDBC Board of Directors meeting (13:00-16:30) at the same venue.</p> +<h4 id="social-dinner">Social Dinner</h4> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235334.png" alt=""></p> +<p><strong>Address: Hauptstraße 217, 69117 Heidelberg</strong><br> +<strong>Time: 19:00 / 7pm</strong></p> +<p>(See attachments at the bottom of the page)</p> +<h5 id="thursday">Thursday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>Welcome and logistics - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>9:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235329.pdf">Intro + state of the LDBC - Josep Lluis Larriba Pey</a> (UPC)</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235338.pdf">LDBC Graph QL task force</a> - Hannes Voigt (TU Dresden)</td> +</tr> +<tr> +<td>9:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235335.pdf">PGQL Status Update and Comparison to LDBC&rsquo;s Graph QL proposals</a> - Oskar van Rest (Oracle Labs)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628546.pdf">Adding shortest-paths to MonetDB</a> - Dean de Leo (CWI)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431939.pdf">Evolving Cypher for processing multiple graphs</a> - Stefan Plantikow (Neo Technology)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235346.pdf">Standardizing Graph Database Functionality - An Invitation to Collaborate</a> - Jan Michels (ISO/ANSI SQL, Oracle)&quot;</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235343.pdf">Dgraph: Graph database for production environment</a> - Tomasz Zdybal (Dgraph.io)</td> +</tr> +<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431945.pdf">LDBC Graphalytics: Current Capabilities, Upcoming Features, and Long-Term Roadmap</a> - Alexandru Iosup (TU Delft)</td> +</tr> 
+<tr> +<td>13:20</td> +<td>LDBC Graphalytics: Demo of the Live Archive and Competition Features - Tim Hegeman (TU Delft)</td> +</tr> +<tr> +<td>13:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">LDBC SNB Datagen Update</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431943.pdf">LDBC SNB Business Intelligence Workload: Chokepoint Analysis</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431947.pdf">LDBC Benchmark Cost Specification</a> (+discussion) - Moritz Kaufmann (TU Munich)</td> +</tr> +<tr> +<td>14:40</td> +<td>coffee break</td> +</tr> +<tr> +<td>15:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76316673.pdf">EYWA: the Distributed Graph Engine in Huawei MIND Platform</a> (Yinglong Xia)</td> +</tr> +<tr> +<td>15:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431949.pdf">Graph Processing in SAP HANA</a> - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>15:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628563.pdf">Distributed Graph Analytics with Gradoop</a> - Martin Junghanns (Univ Leipzig)</td> +</tr> +<tr> +<td>16:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152834.pdf">Distributed graph flows: Cypher on Flink and Gradoop</a> - Max Kießling (Neo Technology)</td> +</tr> +<tr> +<td>16:30</td> +<td>closing - Peter Boncz</td> +</tr> +<tr> +<td>17:30</td> +<td>end</td> +</tr> +</tbody> +</table> +<h5 id="friday">Friday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>welcome - Peter Boncz</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152833.pdf">Graph processing in obi4wan</a> - Frank Smit (OBI4WAN)</td> +</tr> +<tr> +<td>9:40</td> +<td>Graph problems in the space domain - Albrecht Schmidt (ESA)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75792387.pdf">Medical Ontologies for Healthcare</a> - Michael Neumann (SAP)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76447745.pdf">The Train Benchmark: Cross-Technology Performance Evaluation of Continuous Model Queries</a> - Gabor Szarnyas (BME)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76021761.pdf">Efficient sparse matrix computations and their generalization to graph computing applications</a> - Albert-Jan Yzelman (Huawei)</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152837.pdf">Experiments on Semantic Publishing Benchmark with large scale real news and LOD data at FactForge</a> - Atanas Kyriakov (Ontotext)</td> +</tr> 
+<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td>LDBC Board of Directors Meeting</td> +</tr> +<tr> +<td>17:00</td> +<td>end</td> +</tr> +</tbody> +</table> +<h3 id="logistics">Logistics</h3> +<h5 id="important-things-to-know"><strong>Important things to know</strong></h5> +<p>The following PDF guide provides additional information, such as recommended restaurants as well as sightseeing spots: <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">link</a></p> +<h5 id="venue"><strong>Venue</strong></h5> +<p>The TUC meeting will be held in the <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> at the SAP Guesthouse Kalipeh (<a href="https://www.kalipeh.com">https://www.kalipeh.com</a>). The address is:</p> +<p><strong>WDF 44 / SAP Guesthouse Kalipeh<br> +Dietmar-Hopp-Allee 15<br> +69190 Walldorf<br> +Germany</strong></p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p><a href="https://www.google.com/maps/place/SAP+Guesthouse+Kalipeh/@49.2951903,8.6436224,17z/data=!3m1!4b1!4m5!3m4!1s0x4797bea343a566af:0xd70698f3503ab74b!8m2!3d49.2951868!4d8.6458111">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/69042180.png" alt=""></p> +<h4 id="getting-there"><strong>Getting there</strong></h4> +<h5 id="by-plane"><strong>By plane</strong></h5> +<p>There are two airports close to SAP&rsquo;s headquarter: Frankfurt Airport (FRA) and Stuttgart-Echterdingen Airport (STR). The journey from Frankfurt Airport to SAP headquarters takes about one hour by car, while it takes slightly longer from Stuttgart- Echterdingen Airport. Concerning airfare, flights to Frankfurt are usually somewhat more expensive than to Stuttgart.</p> +<p>When booking flights to Frankfurt, you should be aware of Frankfurt-Hahn Airport (HHN), which serves low-cost carriers but is not connected to Frankfurt Airport. Frankfurt Hahn is approximately one hour from the Frankfurt main airport by car.</p> +<p>The journey from Frankfurt Airport to SAP headquarters takes about one hour by car (95 kilometers, or 59 miles).</p> +<p>Journey time from Stuttgart-Echterdingen Airport to SAP headquarters takes about 1 hour and 15 minutes by car (115 kilometers, or 71 miles).</p> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<p><strong>Traveling from Frankfurt Airport (FRA) to SAP Headquarters:</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A3/Würzburg/A5/Kassel/Basel/Frankfurt.&rdquo;</li> +<li>Follow the A5 to &ldquo;Basel/Karlsruhe/Heidelberg.&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<p>(Should you use a navigational system which does not recognize the street name &lsquo;Dietmar-Hopp-Allee&rsquo; please use &lsquo;Neurottstrasse&rsquo; instead.)</p> +<p><strong>Traveling from Stuttgart-Echterdingen Airport (STR) to SAP Headquarters:</strong></p> +<p>To get to SAP headquarters by car, there are two possible routes to take. The first leads you via Heilbronn and the second via Karlsruhe. 
The route via Karlsruhe is a bit shorter yet may be more congested.</p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A8/Stuttgart/B27.&rdquo;</li> +<li>Stay on A8 and follow the sign for &ldquo;Karlsruhe/Heilbronn/Singen/A8.&rdquo;</li> +<li>Follow A8 to Karlsruhe.</li> +<li>Take exit 41 &ndash; &ldquo;Dreieck Karlsruhe&rdquo; to merge onto A5 toward &ldquo;Frankfurt/Mannheim/Karlsruhe/Landau (Pfalz).&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<h6 id="parking"><strong>Parking</strong></h6> +<p>The closest parking lot to the event location is P7 (see figure above).</p> +<h5 id="by-train"><strong>By Train</strong></h5> +<p>As the infrastructure is very well developed in Europe, and in Germany in particular, taking the train is a great and easy way of traveling. Furthermore, the trains usually run on time, so this mode of travel is very convenient, especially for a group of people on longer journeys to major cities.</p> +<p><strong>From Frankfurt Airport (FRA) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to Terminal 1, level T (see overview in Appendix).</li> +<li>Go to the AIRail Terminal &ndash; &ldquo;Fernbahnhof&rdquo; (long-distance trains).</li> +<li>Choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP.&rdquo; It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> +<p><strong>From Stuttgart-Echterdingen Airport (STR) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to the S-Bahn station in the airport, following the sign (station is called &ldquo;Stuttgart Flughafen/Messe&rdquo;).</li> +<li>Take train number S2 or S3 to &ldquo;Stuttgart Hauptbahnhof&rdquo; (main station).</li> +<li>From Stuttgart Hauptbahnhof choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP&rdquo;. It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> + + + + + LDBC Is Proud to Announce the New LDBC Graphalytics Benchmark Draft Specification + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + Tue, 06 Sep 2016 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + <p>LDBC is proud to announce the new LDBC Graphalytics Benchmark draft specification.</p> +<p>LDBC Graphalytics is the first industry-grade graph data management benchmark for graph analysis platforms such as Giraph. It consists of six core algorithms, standard datasets, synthetic dataset generators, and reference outputs, enabling the objective comparison of graph analysis platforms. 
It has strong industry support from Oracle, Intel, Huawei and IBM, and was tested and optimized on the best industrial and open-source systems.</p>
+<p>Tim Hegeman of <a href="https://www.tudelft.nl">TU Delft</a> is today presenting the technical paper describing LDBC Graphalytics at the important <a href="https://www.vldb.org/conference.html">VLDB</a> (Very Large DataBases) conference in New Delhi, where his talk also marks the release by LDBC of Graphalytics as a benchmark draft. Practitioners are invited to read the PVLDB paper, download the software and try running it.</p>
+<p>LDBC is eager to use any feedback for its future adoption of LDBC Graphalytics.</p>
+<p>Learn more: <a href="/ldbc-graphalytics">LDBC Graphalytics</a></p>
+<p>GitHub: <a href="https://github.com/tudelft-atlarge/graphalytics">https://github.com/tudelft-atlarge/graphalytics</a></p>
+ + + + + Eighth TUC Meeting + https://ldbcouncil.org/event/eighth-tuc-meeting/ + Wed, 22 Jun 2016 14:45:20 -0400 + + https://ldbcouncil.org/event/eighth-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Eighth Technical User Community (TUC) meeting.</p>
+<p>This will be a two-day event at the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a> in the Redwood Shores facility on <strong>Wednesday and Thursday June 22-23, 2016</strong>.</p>
+<p>This will be the second TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically cover the following aspects:</p>
+<ul>
+<li>Two-day event with one day devoted to users&rsquo; experiences and one day devoted to benchmarking experiences.</li>
+<li>Presentation of the benchmarking results for the different benchmarks.</li>
+<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li>
+</ul>
+<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify Oracle security in advance, registration requests need to be in by <strong>June 12</strong>.</p>
+<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and in hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmarks (or proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p>
+<p>Further, we call on you, if you or your colleagues happen to have contacts with companies that deal with graph data management scenarios, to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUC meetings, its graph technology user contacts, and eventually its membership base.</p>
+<p>In this page, you&rsquo;ll find information about the following items:</p>
+<ul>
+<li><a href="#agenda">Agenda</a></li>
+<li><a href="#logistics">Logistics</a>
+<ul>
+<li><a href="#date">Date</a></li>
+<li><a href="#venue">Venue</a></li>
+<li><a href="#getting-there">Getting there</a></li>
+</ul>
+</li>
+<li><a href="#accommodation">Accommodation</a></li>
+</ul>
+<h3 id="agenda">Agenda</h3>
+<p>On Wednesday, lunch is provided for all attendees at 12 pm. The TUC Meeting will start at 1pm.</p>
+<h6 id="wednesday-22th-of-june-2016-room-203"><strong>Wednesday, 22nd of June 2016 (Room 203)</strong></h6>
+<p>(full morning: LDBC Board of Directors meeting)</p>
+<ul>
+<li>12:00 - 13:00 Lunch (provided)</li>
+<li>13:00 - 13:30 Hassan Chafi (Oracle) and Josep L. Larriba-Pey (Sparsity) Registration and welcome.</li>
+<li>13:30 - 14:00 Peter Boncz (CWI) <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133891.pdf">LDBC introduction and status update</a>.</li>
+<li>14:00 - 15:00 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</li>
+<li>14:00 Arnau Prat (DAMA-UPC). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133902.pdf">Social Network Benchmark, Interactive workload</a>.</li>
+<li>14:30 Tim Hegeman (TU Delft). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133893.pdf">Social Network Benchmark, Analytics workload</a>.</li>
+<li>15:00 - 15:30 Coffee break</li>
+<li>15:30 - 17:00 Applications and use of Graph Technologies (chair Hassan Chafi)
+<ul>
+<li>15:30 Martin Zand (University of Rochester Clinical and Translational Science Institute). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133897.pdf">Graphing Healthcare Networks: Data, Analytics, and Use Cases.</a></li>
+<li>16:00 David Meibusch, Nathan Hawes (Oracle Labs Australia). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133901.pdf">Frappé: Querying and managing evolving code dependency graphs</a>.</li>
+<li>16:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133895.pdf">UniProt: challenges of a public SPARQL endpoint.</a></li>
+</ul>
+</li>
+<li>17:00 - 18:30 Graph Technologies (chair Peter Boncz)
+<ul>
+<li>17:00 Eugene I. Chong (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133904.pdf">Balancing Act to improve RDF Query Performance in Oracle Database</a>.</li>
+<li>17:30 Lijun Chang (University of New South Wales). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133906.pdf">Efficient Subgraph Matching by Postponing Cartesian Products</a>.</li>
+<li>18:00 Weining Qian (East China Normal University). 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133908.pdf">On Statistical Characteristics of Real-Life Knowledge Graphs</a>.</li> +</ul> +</li> +</ul> +<h6 id="thursday-23th-of-june-2016-room-203"><strong>Thursday, 23th of June 2016 (Room 203)</strong></h6> +<ul> +<li>08:00 - 09:00 Breakfast (provided)</li> +<li>09:00 - 10:00 Details on the progress of LDBC Task Forces 2 (chair Josep L. Larriba-Pey) +<ul> +<li>09:00 Peter Boncz (CWI). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133896.pdf">Query Language Task Force status</a></li> +<li>09:45 Marcus Paradies (SAP). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297729.pdf">Social Network Benchmark, Business Intelligence workload</a></li> +</ul> +</li> +<li>10:00 - 12:00 Graph Technologies and Benchmarking (chair Oskar van Rest) +<ul> +<li>10:00 Sergey Edunov (Facebook). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297731.pdf">Generating realistic trillion-edge graphs</a></li> +<li>10:30 George Fletcher (TU Eindhoven). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297733.pdf">An open source framework for schema-driven graph instance and graph query workload generation</a>.</li> +<li>11:00 Yinglong Xia (Huawei Research America): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297735.pdf">An Efficient Big Graph Analytics Platform</a>.</li> +<li>11:30 Zhe Wu (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297737.pdf">Bridging RDF Graph and Property Graph Data Models</a></li> +</ul> +</li> +<li>12:00 - 13:30 Lunch (provided)</li> +<li>13:30 - 15:30 Graph Technologies (chair Arnau Prat) +<ul> +<li>13:30 Tobias Lindaaker (Neo Technology). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297740.pdf">An open standard for graph queries: the Cypher contribution</a></li> +<li>14:00 Arash Termehchy (Oregon State University). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297742.pdf">Toward Representation Independent Graph Querying &amp; Analytics</a></li> +<li>14:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297745.pdf">In the service of the federation</a></li> +<li>15:00 Nandish Jayaram (Pivotal). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297747.pdf">Orion: Enabling Suggestions in a Visual Query Builder for Ultra-Heterogeneous Graphs</a>.</li> +</ul> +</li> +<li>15:30 - 16:00 Coffee break</li> +<li>16:00 - 17:15 Applications and use of Graph Technologies (chair Hassan Chafi) +<ul> +<li>16:00 Jans Aasman (Franz Inc.). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428806.pdf">Semantic Data Lake for Healthcare</a></li> +<li>16:15 Kevin Madden (Tom Sawyer Software). 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428812.pdf">Dismantling Criminal Networks with Graph and Spatial Visualization and Analysis</a></li> +<li>16:45 Juan Sequeda (Capsenta). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428810.pdf">Using graph representation and semantic technology to virtually integrate and search multiple diverse data sources</a></li> +<li>17:15 Kevin Wilkinson (Hewlett Packard Labs). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428808.pdf">LDBC SNB extensions</a></li> +</ul> +</li> +<li>17:45 - 18:15 Closing discussion</li> +</ul> +<h6 id="friday-24th-of-june-2016-room-105"><strong>Friday, 24th of June 2016 (Room 105)</strong></h6> +<p>At the same venue: the fourth international workshop on Graph Data Management, Experience and Systems (<strong>GRADES16</strong>).</p> +<p>18:30 social dinner for GRADES registrants (place to be announced)</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>22nd and 23rd June 2016</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a></p> +<p>The address is:</p> +<p><strong>Room 203 (Wed-Thu) &amp; Room 105 (Fri)</strong><br> +<strong>Oracle Conference Center</strong><br> +<strong>350 Oracle Parkway</strong><br> +<strong>Redwood City, CA 94065, USA</strong></p> +<p><strong>Maps and situation</strong></p> +<p><a href="https://www.google.com/maps/place/Oracle+Conference+Center/@37.5322827,-122.2667034,17z/data=!3m1!4b1!4m2!3m1!1s0x808f98b5450e8ca3:0xdc75e8b1c02bbb91">Google Maps link</a></p> +<p>Oracle Campus map:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/40927234.jpg" alt=""></p> +<h5 id="getting-there"><strong>Getting there</strong></h5> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<ul> +<li>[Southbound] <strong>-</strong> Take Highway 101 South (toward San Jose) to the Ralston Ave./Marine World Parkway exit. Take Marine World Parkway east which will loop you back over the freeway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +<li>[Northbound] <strong>-</strong> Take Highway 101 North (toward San Francisco) to the Ralston Ave./Marine World Parkway exit. Take the first exit ramp onto Marine World Parkway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +</ul> +<h5 id="parking"><strong>Parking</strong></h5> +<p>The Conference Center has a designated parking lot located directly across from the building. If the lot is filled there is also additional parking in any of the parking garages located near by. No parking permits are needed.</p> +<h5 id="public-transport"><strong>Public transport</strong></h5> +<p>Take the Caltrain to either San Carlos or Hillsdale and take the free Oracle shuttle from there. 
Get off the Oracle shuttle at 100 Oracle Parkway (second stop) and walk 5 minutes to get to the Conference Center.</p> +<ul> +<li>Caltrain timetables: <a href="http://www.caltrain.com/schedules/weekdaytimetable.html">http://www.caltrain.com/schedules/weekdaytimetable.html</a></li> +<li>Oracle Shuttle timetables: <a href="http://www.caltrain.com/schedules/weekdaytimetable.html">http://www.caltrain.com/schedules/Shuttles/Oracle_Shuttle.html</a></li> +</ul> +<p>You can also take the Caltrain to Belmont and walk 23 min, instead of taking the Oracle shuttle.</p> +<p>Alternatively, SamTrans (San Mateo County&rsquo;s Transit Agency) provides public bus service between the Millbrae BART station and Palo Alto with three stops on Oracle Parkway - one of which is directly in front of the Oracle Conference Center.</p> + + + + + LDBC and Apache Flink + https://ldbcouncil.org/post/ldbc-and-apache-flink/ + Mon, 16 Nov 2015 14:47:00 +0000 + + https://ldbcouncil.org/post/ldbc-and-apache-flink/ + <p>Apache Flink <a href="#references">[1]</a> is an open source platform for distributed stream and batch data processing. Flink&rsquo;s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.</p> +<p><img src="https://flink.apache.org/img/flink-stack-small.png" alt=""></p> +<p>Flink offers multiple APIs to process data from various data sources (e.g. HDFS, HBase, Kafka and JDBC). The DataStream and DataSet APIs allow the user to apply general-purpose data operations, like map, reduce, groupBy and join, on streams and static data respectively. In addition, Flink provides libraries for machine learning (Flink ML), graph processing (Gelly) and SQL-like operations (Table). 
All APIs can be used together in a single Flink program which enables the definition of powerful analytical workflows and the implementation of distributed algorithms.</p> +<p>The following snippet shows how a wordcount program can be expressed in Flink using the DataSet API:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">&gt;</span> text <span style="color:#f92672">=</span> env<span style="color:#f92672">.</span><span style="color:#a6e22e">fromElements</span><span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the past controls the future.&#34;</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the present controls the past.&#34;</span><span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>Tuple2<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">,</span> Integer<span style="color:#f92672">&gt;&gt;</span> wordCounts <span style="color:#f92672">=</span> text +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">flatMap</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> LineSplitter<span style="color:#f92672">())</span> <span style="color:#75715e">// splits the line and outputs (word,1) +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span>tuples<span style="color:#f92672">.</span><span style="color:#a6e22e">groupBy</span><span style="color:#f92672">(</span><span style="color:#ae81ff">0</span><span style="color:#f92672">)</span> <span style="color:#75715e">// group by word +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">.</span><span style="color:#a6e22e">sum</span><span style="color:#f92672">(</span><span style="color:#ae81ff">1</span><span style="color:#f92672">);</span> <span style="color:#75715e">// sum the 1&#39;s +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span>wordCounts<span style="color:#f92672">.</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>At the Leipzig University, we use Apache Flink as execution layer for our graph analytics platform Gradoop <a href="#references">[2]</a>. The LDBC datagen helps us to evaluate the scalability of our algorithms and operators in a distributed execution environment. To use the generated graph data in Flink, we wrote a tool that transforms the LDBC output files into Flink data sets for further processing <a href="#references">[3]</a>. 
Using the class <code>LDBCToFlink</code>, LDBC output files can be read directly from HDFS or from the local file system:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;hdfs:///ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> <span style="color:#75715e">// or &#34;/path/to/social_network&#34; +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> vertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> edges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The tuple classes <code>LDBCVertex</code> and <code>LDBCEdge</code> hold the information generated by the LDBC datagen and are created directly from its output files. During the transformation process, globally unique vertex identifiers are created based on the LDBC identifier and the vertex class. When reading edge files, source and target vertex identifiers are computed in the same way to ensure consistent linking between vertices.</p> +<p>Each <code>LDBCVertex</code> instance contains:</p> +<ul> +<li>an identifier, which is unique among all vertices * a vertex label (e.g. <code>Person</code>, <code>Comment</code>) * a key-value map of properties including also multivalued properties<br> +(e.g. <code>Person.email</code>)</li> +</ul> +<p>Each <code>LDBCEdge</code> instance contains:</p> +<ul> +<li>an identifier, which is unique among all edges</li> +<li>an edge label (e.g. <code>knows</code>, <code>likes</code>)</li> +<li>a source vertex identifier</li> +<li>a target vertex identifier</li> +<li>a key-value map of properties</li> +</ul> +<p>The resulting datasets can be used by the DataSet API and all libraries that are built on top of it (i.e. Flink ML, Gelly and Table). In the following example, we load the LDBC graph from HDFS, filter vertices with the label <code>Person</code> and edges with the label <code>knows</code> and use Gelly to compute the connected components of that subgraph. 
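</p>
+<p>The label filters used in the example below are ordinary Flink <code>FilterFunction</code>s. As a rough sketch (not the tool&rsquo;s documented API), and assuming that <code>LDBCVertex</code> exposes its label through a <code>getLabel()</code> accessor, a vertex label filter could look like this:</p>
+<pre><code class="language-java">import org.apache.flink.api.common.functions.FilterFunction;

// Rough sketch only: keep vertices that carry a given label.
// Assumes LDBCVertex exposes its label via a getLabel() accessor
// (an assumption made here, not a documented part of the tool's API).
public class VertexLabelFilter implements FilterFunction&lt;LDBCVertex&gt; {

  private final String label;

  public VertexLabelFilter(String label) {
    this.label = label;
  }

  @Override
  public boolean filter(LDBCVertex vertex) {
    return label.equals(vertex.getLabel());
  }
}
</code></pre>
+<p>An <code>EdgeLabelFilter</code> over <code>LDBCEdge</code> can be written analogously. 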
The full source code is available on GitHub <a href="#references">[4]</a>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;/home/s1ck/Devel/Java/ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter vertices with label “Person” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> ldbcVertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">VERTEX_CLASS_PERSON</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter edges with label “knows” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> ldbcEdges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">EDGE_CLASS_KNOWS</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly vertices suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> vertices <span style="color:#f92672">=</span> ldbcVertices<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span 
style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly edges suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Edge<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;&gt;</span> edges <span style="color:#f92672">=</span> ldbcEdges<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>Graph<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;</span> g <span style="color:#f92672">=</span> Graph<span style="color:#f92672">.</span><span style="color:#a6e22e">fromDataSet</span><span style="color:#f92672">(</span>vertices<span style="color:#f92672">,</span> edges<span style="color:#f92672">,</span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// run connected components on the subgraph for 10 iterations +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> components <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> g<span style="color:#f92672">.</span><span style="color:#a6e22e">run</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> ConnectedComponents<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// print the component id of the first 10 vertices +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>components<span style="color:#f92672">.</span><span style="color:#a6e22e">first</span><span style="color:#f92672">(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">).</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The ldbc-flink-import tool is available on Github <a href="#references">[3]</a> and licensed under the GNU GPLv3. If you have any questions regarding the tool please feel free to contact me on GitHub. 
If you find bugs or have any ideas for improvements, please create an issue or a pull request.</p> +<p>If you want to learn more about Apache Flink, a good starting point is the main documentation <a href="#references">[5]</a> and if you have any question feel free to ask the official mailing lists.<br> +There is also a nice set of videos <a href="#references">[6]</a> available from the latest Flink Forward conference.</p> +<h4 id="references">References</h4> +<p>[1] <a href="http://flink.apache.org/">http://flink.apache.org/</a></p> +<p>[2] <a href="https://github.com/dbs-leipzig/gradoop">https://github.com/dbs-leipzig/gradoop</a></p> +<p>[3] <a href="https://github.com/s1ck/ldbc-flink-import">https://github.com/s1ck/ldbc-flink-import</a></p> +<p>[4] <a href="https://gist.github.com/s1ck/b33e6a4874c15c35cd16">https://gist.github.com/s1ck/b33e6a4874c15c35cd16</a></p> +<p>[5] <a href="https://ci.apache.org/projects/flink/flink-docs-release-0.10/">https://ci.apache.org/projects/flink/flink-docs-release-0.10/</a></p> +<p>[6] <a href="https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA">https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA</a></p> + + + + + Seventh TUC Meeting + https://ldbcouncil.org/event/seventh-tuc-meeting/ + Mon, 09 Nov 2015 14:17:30 -0400 + + https://ldbcouncil.org/event/seventh-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Seventh Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="http://www.research.ibm.com/labs/watson">IBM&rsquo;s TJ Watson</a> facility on <strong>Monday and Tuesday November 9/10, 2015.</strong></p> +<p>This will be the first TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify IBM security in advance, registration requests need to be in by Nov 1.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<p>In this page, you&rsquo;ll find information about the following items:</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a><br> +- <a href="#date"><strong>Date</strong></a><br> +- <a href="#venue"><strong>Venue</strong></a><br> +- <a href="#maps-and-situation"><strong>Maps and situation</strong></a><br> +- <a href="#getting-there"><strong>Getting there</strong></a></li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>Monday, 9th of November 2015</strong></p> +<p>8:45 - 9:15 Registration and welcome (Yinglong Xia and Josep L. Larriba Pey)</p> +<p>9:15 - 9:30 LDBC introduction and status update (Josep L. Larriba-Pey)</p> +<p>9:30 - 10:30 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</p> +<p>9:30 Arnau Prat (DAMA-UPC). Social Network Benchmark, Interactive workload</p> +<p>10:00 Orri Erling (OpenLink Software). Social Network Benchmark, Business Intelligence workload</p> +<p>10:30-11:00 Coffee break</p> +<p>11:00 - 12:30 Details on the progress of LDBC Task Forces 2 (chair Yinglong Xia)</p> +<p>11:00 Alexandru Iosup (TU Delft). Social Network Benchmark, Analytics workload.</p> +<p>11:30 Claudio Gutierrez (U Chile). Query Language Task Force status.</p> +<p>12:00 Atanas Kiryakov (Ontotext). Semantic Publishing Benchmark status</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 - 16:00 Technologies and benchmarking (chair Hassan Chafi)</p> +<p>14:00 Molham Aref (LogicBlox). Graph Data Management with LogicBlox</p> +<p>14:30 Peter Kogge (Notre Dame). BFS as in Graph500 on today&rsquo;s architectures</p> +<p>15:00 Ching-Yung Lin (IBM). Status and Demo of IBM System G</p> +<p>15:30-16:00 Coffee break</p> +<p>16:00 - 17:00 Technologies (chair Irini Fundulaki)</p> +<p>16:00 Kavitha Srinivas (IBM). SQLGraph: An efficient relational based property graph store</p> +<p>16:30 David Ediger (GeorgiaTech). STINGER</p> +<p>17:00 Gary King (Franz Inc.). AllegroGraph&rsquo;s SPARQL implementation with Social Network Analytics abilities using Magic Properties</p> +<p>17:30 Manoj Kumar (IBM). Linear Algebra Formulation for Large Graph Analytics</p> +<p>18:00 Reihaneh Amini (Wright State University) Linked Data in the GeoLink Usecase</p> +<p>19:00 Social dinner</p> +<p><strong>Tuesday 10th November 2015</strong></p> +<p>9:00 - 10:30 Technology, Applications and Benchmarking (chair Alexandru Iosup)</p> +<p>9:00 Philip Rathle (Neo). On openCypher</p> +<p>9:20 Morteza Shahriari (University of Florida). Multi-modal Probabilistic Knowledge Base for Remote Sensing Species Identification</p> +<p>9:50 Peter Kogge (Notre Dame). Challenging problems with Lexis Nexis Risk Solutions</p> +<p>10:10 Arnau Prat (DAMA-UPC). DATAGEN, status and perspectives for synthetic data generation</p> +<p>10:30 - 11:00 Coffee break</p> +<p>11:00 - 12:45 Applications and use of Graph Technologies (chair Atanas Kiryakov)</p> +<p>11:00 Hassan Chafi (Oracle). Status and characteristics of PGQL</p> +<p>11:20 David Guedalia (TAGIIO). Multi-tier distributed mobile applications and how they split their workload,</p> +<p>11:40 Guojing Cong (IBM). Algorithmic technique and architectural support for fast graph analysis</p> +<p>12:00 Josep Lluis Larriba-Pey. 
Conclusions for the TUC meeting and future perspectives</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>9th and 10th November 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the IBM Thomas J Watson Research Center.<br> +The address is:</p> +<p><strong>IBM Thomas J Watson Research Center</strong><br> +<strong>1101 Kitchawan Rd,</strong><br> +<strong>Yorktown Heights, NY 10598, USA</strong></p> +<p>If you are using a <em>GPS system</em>, please enter <strong>&ldquo;200 Aqueduct Road, Ossining NY, 10562&rdquo;</strong> for accurate directions to the lab entrance. You may also want to check the routing online.</p> +<p>The meeting will take place in the <em>Auditorium</em> on November 9th, and in Meeting Room <em>20-043</em> on November 10th.</p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p>You are highly suggested to <strong>rent a car</strong> for your convenience, since the public transportation system does not cover this area very well. Besides, there is no hotel within walkable distance to the IBM T.J. Watson Research Center. Feel free to find carpool with other attendees. You may find car rental and hotels through <a href="http://www.orbitz.com">www.orbitz.com</a>, or <a href="http://www.expedia.com">www.expedia.com</a> Feel free to email <a href="mailto:yxia@us.ibm.com">yxia@us.ibm.com</a> for any questions.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/seventh-tuc-meeting/attachments/6882333/15926330.png" alt=""></p> +<h6 id="getting-there"><strong>Getting there</strong></h6> +<p><strong>Upper and Eastern New England</strong></p> +<p>Route I-84 west to Route I-684, south to Exit 6, west on Route 35 to Route 100, south to Route 134, west 2.5 miles. IBM is on the left.</p> +<p><strong>New Haven and Connecticut Shores</strong></p> +<p>Merritt Parkway or New England Thruway (Route I-95) west to Route I-287, west to Exit 3, north on Sprain Brook Parkway, which merges into Taconic State Parkway, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New Jersey</strong></p> +<p>Take New York State Thruway (Route I-87) east across the Tappan Zee Bridge and follow signs to the Saw Mill Parkway north. Proceed north on Saw Mill River Parkway to Taconic State Parkway exit, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>Upstate New York</strong></p> +<p>Route I-84 east across Newburgh-Beacon Bridge to Exit 16-S. Taconic State Parkway south to Route 134 East exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New York City (Manhattan)</strong></p> +<p>Henry Hudson Parkway north, which becomes Saw Mill River Parkway, north to Taconic State Parkway exit. North on Taconic State Parkway to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>John F. Kennedy International Airport</strong></p> +<p>North on Van Wyck Expressway to the Whitestone Expressway and continue north across the Bronx-Whitestone Bridge to the Hutchinson River Parkway north to the Cross County Parkway exit and proceed west to the Bronx River Parkway. 
North on the Bronx River Parkway to the Sprain Brook Parkway, which merges into the Taconic State Parkway. Continue north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>LaGuardia Airport</strong></p> +<p>East on the Grand Central Parkway, north on the Whitestone Expressway, and continue north across the Bronx-Whitestone Bridge. Continue with instructions from John F. Kennedy International Airport, above.</p> +<p><strong>Newark International Airport</strong></p> +<p>North on the New Jersey Turnpike (Route I-95). Stay in local lanes and take Exit 72 for Palisades Interstate Parkway. North on the Palisades Interstate Parkway to the New York State Thruway, Route I-87, and east across the Tappan Zee Bridge. Continue with instructions from New Jersey, above.</p> +<p><strong>Stewart International Airport</strong></p> +<p>Route 207 east to Route I-84, east across Newburgh-Beacon Bridge to Taconic State Parkway, south. Continue with instructions from Upstate New York, above.</p> +<p><strong>Westchester County Airport</strong></p> +<p>Right on Route 120, north. Turn left where Route 120 merges with Route 133. Continue on Route 120. Cross Route 100 and continue straight on Shingle House Road to Pines Bridge Road. Turn right and proceed several hundred yards. IBM is on the left.</p> +<p><strong>Public Transportation</strong></p> +<p>Metropolitan Transportation Authority (MTA) train stations nearest to the Yorktown Heights location are the Croton-Harmon and White Plains stations. Taxi service is available at both locations.</p> + + + + + Elements of Instance Matching Benchmarks: a Short Overview + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + Tue, 16 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + <p>The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not explicitly stated but is discovered using <strong>instance matching</strong> techniques and tools. Instance matching is also known as <strong>record linkage</strong> <a href="#references">[1]</a>, <strong>duplicate detection</strong> <a href="#references">[2]</a>, <strong>entity resolution</strong> <a href="#references">[3]</a> and <strong>object identification</strong> <a href="#references">[4]</a>.</p> +<p>For instance, a search in Geonames (<a href="http://www.geonames.org/">http://www.geonames.org/</a>) for &ldquo;Athens&rdquo; would return a resource (i.e., URI) accompanied with a map of the area and information about the place; additional information for the city of Athens can be found in other datasets such as for instance DBpedia (<a href="http://dbpedia.org/">http://dbpedia.org/</a>) or Open Government Datasets (<a href="http://data.gov.gr/">http://data.gov.gr/</a>). 
To obtain all the necessary information about the city of Athens, we need to establish that the retrieved resources refer to the same real world object.</p>
+<p>Web resources are published by &ldquo;autonomous agents&rdquo; who choose their preferred information representation or the one that best fits the application of interest. Furthermore, different representations of the same real world entity are due to data acquisition errors or different acquisition techniques used to process scientific data. Moreover, real world entities evolve and change over time, and sources need to keep track of these developments, a task that is very hard and often not possible. Finally, when integrating data from multiple sources, the process itself may add new erroneous data. Clearly, these problems are not limited to the era of Web Data; it is thus not surprising that instance matching systems have been around for several years <a href="#references">[2]</a><a href="#references">[5]</a>.</p>
+<p>It is, however, essential at this point to develop, along with instance and entity matching systems, <em>instance matching benchmarks to determine the weak and strong points of those systems, as well as their overall quality, in order to support users in deciding which system to use for their needs</em>. Hence, well-defined, good-quality benchmarks are important for comparing the performance of the available or under-development instance matching systems. Benchmarks are used not only to inform users of the strengths and weaknesses of systems, but also to motivate developers, researchers and technology vendors to address the weak points of their systems and to improve their performance and functionality. They are also useful for identifying the settings in which each of the systems has optimal performance. Benchmarking aims at providing an objective basis for such assessments.</p>
+<p>An instance matching benchmark for Linked Data consists of a <em>source</em> and a <em>target dataset</em> implementing a set of <em>test cases</em>, where each test case addresses a different kind of requirement regarding instance matching, a <em>ground truth</em> or <em>gold standard</em>, and finally the <em>evaluation metrics</em> used to <em>assess the benchmark</em>.</p>
+<p>Datasets are the raw material of a benchmark. A benchmark comprises a <em>source</em> and a <em>target</em> dataset, and the objective of an instance matching system is to discover the matches between the two. Datasets are characterized by (a) their <em>nature</em> (<em>real</em> or <em>synthetic</em>), (b) the <em>schemas/ontologies</em> they use, (c) their <em>domains</em>, (d) the <em>languages</em> they are written in, and (e) the <em>variations/heterogeneities</em> of the datasets. Real datasets are widely used in benchmarks since they offer realistic conditions for heterogeneity problems and they have realistic distributions. <em>Synthetic datasets</em> are generated using automated data generators and are useful because they offer fully controlled test conditions, have accurate gold standards, and allow setting the focus on specific types of heterogeneity problems in a systematic manner.</p>
+<p>Datasets (and benchmarks) may contain different <em>kinds of variations</em> that correspond to <em>different test cases</em>. According to Ferrara et al. 
<a href="#references">[6]</a><a href="#references">[7]</a>, three kinds of variations exist for Linked Data, namely <em>data variations</em>, <em>structural variations</em> and <em>logical variations</em>. The first refers mainly to differences due to typographical errors, differences in the employed data formats, language etc. The second refers to the differences in the structure of the employed Linked Data schemas. Finally, the third type derives from the use of semantically rich RDF and OWL constructs that enable one to define hierarchies and equivalence of classes and properties, (in)equality of instances, complex class definitions through union and intersection among others.</p> +<p>The common case in real benchmarks is that the datasets to be matched contain different kinds (combinations) of variations. On the other hand, synthetic datasets may be purposefully designed to contain specific types (or combinations) of variations (e.g., only structural), or may be more general in an effort to illustrate all the common cases of discrepancies that appear in reality between individual descriptions.</p> +<p>The <em>gold standard</em> is considered as the “correct answer sheet” of the benchmark, and is used to judge the completeness and soundness of the result sets of the benchmarked systems. For instance matching benchmarks employing synthetic datasets, the gold standard is always automatically generated, as the errors (variations) that are added into the datasets are known and systematically created. When it comes to real datasets, the gold standard can be either manually curated or (semi-) automatically generated. In the first case, domain experts manually mark the matches between the datasets, whereas in the second, supervised and crowdsourcing techniques aid the process of finding the matches, a process that is often time consuming and error prone.</p> +<p>Last, an instance matching benchmark uses <em>evaluation metrics</em> to determine and assess the systems’ output quality and performance. For instance matching tools, performance is not a critical aspect. On the other hand, an instance matching tool should return all and only the correct answers. So, what matters most is returning the relevant matches, rather than returning them quickly. For this reason, the evaluation metrics that are dominantly employed for instance matching benchmarks are the standard <em>precision</em>, <em>recall</em> and <em>f-measure</em> metrics.</p> +<h4 id="references">References</h4> +<p>[1] Li, C., Jin, L., and Mehrotra, S. (2006) Supporting efficient record linkage for large data sets using mapping techniques. WWW 2006.</p> +<p>[2] Dragisic, Z., Eckert, K., Euzenat, J., Faria, D., Ferrara, A., Granada, R., Ivanova, V., Jimenez-Ruiz, E., Oskar Kempf, A., Lambrix, P., Montanelli, S., Paulheim, H., Ritze, D., Shvaiko, P., Solimando, A., Trojahn, C., Zamaza, O., and Cuenca Grau, B. (2014) Results of the Ontology Alignment Evaluation Initiative 2014. Proc. 9th ISWC workshop on ontology matching (OM 2014).</p> +<p>[3] Bhattacharya, I. and Getoor, L. (2006) Entity resolution in graphs. Mining Graph Data. Wiley and Sons 2006.</p> +<p>[4] Noessner, J., Niepert, M., Meilicke, C., and Stuckenschmidt, H. (2010) Leveraging Terminological Structure for Object Reconciliation. In ESWC 2010.</p> +<p>[5] Flouris, G., Manakanatas, D., Kondylakis, H., Plexousakis, D., Antoniou, G. 
Ontology Change: Classification and Survey (2008) Knowledge Engineering Review (KER 2008), pages 117-152.</p> +<p>[6] Ferrara, A., Lorusso, D., Montanelli, S., and Varese, G. (2008) Towards a Benchmark for Instance Matching. Proc. 3th ISWC workshop on ontology matching (OM 2008).</p> +<p>[7] Ferrara, A., Montanelli, S., Noessner, J., and Stuckenschmidt, H. (2011) Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p> + + + + + SNB Interactive Part 3: Choke Points and Initial Run on Virtuoso + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + Wed, 10 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + <p>In this post we will look at running the <a href="https://ldbcouncil.org/developer/snb">LDBC SNB</a> on <a href="https://virtuoso.openlinksw.com/">Virtuoso</a>.</p> +<p>First, let&rsquo;s recap what the benchmark is about:</p> +<ol> +<li> +<p>fairly frequent short updates, with no update contention worth mentioning</p> +</li> +<li> +<p>short random lookups</p> +</li> +<li> +<p>medium complex queries centered around a person&rsquo;s social environment</p> +</li> +</ol> +<p>The updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an online social application does lookups for the most part. The medium complex queries are to challenge the DBMS.</p> +<p>The DBMS challenges have to do firstly with query optimization, and secondly with execution with a lot of non-local random access patterns. Query optimization is not a requirement, <em>per se,</em> since imperative implementations are allowed, but we will see that these are no more free of the laws of nature than the declarative ones.</p> +<p>The workload is arbitrarily parallel, so intra-query parallelization is not particularly useful, if also not harmful. There are latency constraints on operations which strongly encourage implementations to stay within a predictable time envelope regardless of specific query parameters. The parameters are a combination of person and date range, and sometimes tags or countries. The hardest queries have the potential to access all content created by people within 2 steps of a central person, so possibly thousands of people, times 2000 posts per person, times up to 4 tags per post. We are talking in the millions of key lookups, aiming for sub-second single-threaded execution.</p> +<p>The test system is the same as used in the <a href="http://www.openlinksw.com/weblog/oerling/?id=1739">TPC-H series</a>: dual Xeon E5-2630, 2x6 cores x 2 threads, 2.3GHz, 192 GB RAM. The software is the <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics branch</a> of <a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack, available from www.github.com</a>.</p> +<p>The dataset is the SNB 300G set, with:</p> +<table> +<thead> +<tr> +<th>1,136,127</th> +<th>persons</th> +</tr> +</thead> +<tbody> +<tr> +<td>125,249,604</td> +<td>knows edges</td> +</tr> +<tr> +<td>847,886,644</td> +<td>posts, including replies</td> +</tr> +<tr> +<td>1,145,893,841</td> +<td>tags of posts or replies</td> +</tr> +<tr> +<td>1,140,226,235</td> +<td>likes of posts or replies</td> +</tr> +</tbody> +</table> +<p>As an initial step, we run the benchmark as fast as it will go. 
We use 32 threads on the driver side for 24 hardware threads.</p> +<p>Below are the numerical quantities for a 400K operation run after 150K operations worth of warmup.</p> +<p><strong>Duration:</strong> 10:41.251<br> +<strong>Throughput:</strong> 623.71 (op/s)</p> +<p>The statistics that matter are detailed below, with operations ranked in order of descending client-side wait-time. All times are in milliseconds.</p> +<table> +<thead> +<tr> +<th>% of total</th> +<th>total_wait</th> +<th>name</th> +<th>count</th> +<th>mean</th> +<th>min</th> +<th>max</th> +</tr> +</thead> +<tbody> +<tr> +<td>20%</td> +<td>4,231,130</td> +<td>LdbcQuery5</td> +<td>656</td> +<td>6,449.89</td> +<td>245</td> +<td>10,311</td> +</tr> +<tr> +<td>11%</td> +<td>2,272,954</td> +<td>LdbcQuery8</td> +<td>18,354</td> +<td>123.84</td> +<td>14</td> +<td>2,240</td> +</tr> +<tr> +<td>10%</td> +<td>2,200,718</td> +<td>LdbcQuery3</td> +<td>388</td> +<td>5,671.95</td> +<td>468</td> +<td>17,368</td> +</tr> +<tr> +<td>7.3%</td> +<td>1,561,382</td> +<td>LdbcQuery14</td> +<td>1,124</td> +<td>1,389.13</td> +<td>4</td> +<td>5,724</td> +</tr> +<tr> +<td>6.7%</td> +<td>1,441,575</td> +<td>LdbcQuery12</td> +<td>1,252</td> +<td>1,151.42</td> +<td>15</td> +<td>3,273</td> +</tr> +<tr> +<td>6.5%</td> +<td>1,396,932</td> +<td>LdbcQuery10</td> +<td>1,252</td> +<td>1,115.76</td> +<td>13</td> +<td>4,743</td> +</tr> +<tr> +<td>5%</td> +<td>1,064,457</td> +<td>LdbcShortQuery3PersonFriends</td> +<td>46,285</td> +<td>22.9979</td> +<td>0</td> +<td>2,287</td> +</tr> +<tr> +<td>4.9%</td> +<td>1,047,536</td> +<td>LdbcShortQuery2PersonPosts</td> +<td>46,285</td> +<td>22.6323</td> +<td>0</td> +<td>2,156</td> +</tr> +<tr> +<td>4.1%</td> +<td>885,102</td> +<td>LdbcQuery6</td> +<td>1,721</td> +<td>514.295</td> +<td>8</td> +<td>5,227</td> +</tr> +<tr> +<td>3.3%</td> +<td>707,901</td> +<td>LdbcQuery1</td> +<td>2,117</td> +<td>334.389</td> +<td>28</td> +<td>3,467</td> +</tr> +<tr> +<td>2.4%</td> +<td>521,738</td> +<td>LdbcQuery4</td> +<td>1,530</td> +<td>341.005</td> +<td>49</td> +<td>2,774</td> +</tr> +<tr> +<td>2.1%</td> +<td>440,197</td> +<td>LdbcShortQuery4MessageContent</td> +<td>46,302</td> +<td>9.50708</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.9%</td> +<td>407,450</td> +<td>LdbcUpdate5AddForumMembership</td> +<td>14,338</td> +<td>28.4175</td> +<td>0</td> +<td>2,008</td> +</tr> +<tr> +<td>1.9%</td> +<td>405,243</td> +<td>LdbcShortQuery7MessageReplies</td> +<td>46,302</td> +<td>8.75217</td> +<td>0</td> +<td>2,112</td> +</tr> +<tr> +<td>1.9%</td> +<td>404,002</td> +<td>LdbcShortQuery6MessageForum</td> +<td>46,302</td> +<td>8.72537</td> +<td>0</td> +<td>1,968</td> +</tr> +<tr> +<td>1.8%</td> +<td>387,044</td> +<td>LdbcUpdate3AddCommentLike</td> +<td>12,659</td> +<td>30.5746</td> +<td>0</td> +<td>2,060</td> +</tr> +<tr> +<td>1.7%</td> +<td>361,290</td> +<td>LdbcShortQuery1PersonProfile</td> +<td>46,285</td> +<td>7.80577</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.6%</td> +<td>334,409</td> +<td>LdbcShortQuery5MessageCreator</td> +<td>46,302</td> +<td>7.22234</td> +<td>0</td> +<td>2,055</td> +</tr> +<tr> +<td>1%</td> +<td>220,740</td> +<td>LdbcQuery2</td> +<td>1,488</td> +<td>148.347</td> +<td>2</td> +<td>2,504</td> +</tr> +<tr> +<td>0.96%</td> +<td>205,910</td> +<td>LdbcQuery7</td> +<td>1,721</td> +<td>119.646</td> +<td>11</td> +<td>2,295</td> +</tr> +<tr> +<td>0.93%</td> +<td>198,971</td> +<td>LdbcUpdate2AddPostLike</td> +<td>5,974</td> +<td>33.3062</td> +<td>0</td> +<td>1,987</td> +</tr> +<tr> +<td>0.88%</td> +<td>189,871</td> 
+<td>LdbcQuery11</td> +<td>2,294</td> +<td>82.7685</td> +<td>4</td> +<td>2,219</td> +</tr> +<tr> +<td>0.85%</td> +<td>182,964</td> +<td>LdbcQuery13</td> +<td>2,898</td> +<td>63.1346</td> +<td>1</td> +<td>2,201</td> +</tr> +<tr> +<td>0.74%</td> +<td>158,188</td> +<td>LdbcQuery9</td> +<td>78</td> +<td>2,028.05</td> +<td>1,108</td> +<td>4,183</td> +</tr> +<tr> +<td>0.67%</td> +<td>143,457</td> +<td>LdbcUpdate7AddComment</td> +<td>3,986</td> +<td>35.9902</td> +<td>1</td> +<td>1,912</td> +</tr> +<tr> +<td>0.26%</td> +<td>54,947</td> +<td>LdbcUpdate8AddFriendship</td> +<td>571</td> +<td>96.2294</td> +<td>1</td> +<td>988</td> +</tr> +<tr> +<td>0.2%</td> +<td>43,451</td> +<td>LdbcUpdate6AddPost</td> +<td>1,386</td> +<td>31.3499</td> +<td>1</td> +<td>2,060</td> +</tr> +<tr> +<td>0.01%</td> +<td>1,848</td> +<td>LdbcUpdate4AddForum</td> +<td>103</td> +<td>17.9417</td> +<td>1</td> +<td>65</td> +</tr> +<tr> +<td>0.00%</td> +<td>44</td> +<td>LdbcUpdate1AddPerson</td> +<td>2</td> +<td>22</td> +<td>10</td> +<td>34</td> +</tr> +</tbody> +</table> +<p>At this point we have in-depth knowledge of the choke points the benchmark stresses, and we can give a first assessment of whether the design meets its objectives for setting an agenda for the coming years of graph database development.</p> +<p>The implementation is well optimized in general but still has maybe 30% room for improvement. We note that this is based on a compressed column store. One could think that alternative data representations, like in-memory graphs of structs and pointers between them, are better for the task. This is not necessarily so; at the least, a compressed column store is much more space efficient. Space efficiency is the root of cost efficiency, since as soon as the working set is not in memory, a random access workload is badly hit.</p> +<p>The set of choke points (technical challenges) actually revealed by the benchmark is so far as follows:</p> +<ul> +<li> +<p><em>Cardinality estimation under heavy data skew —</em> Many queries take a tag or a country as a parameter. The cardinalities associated with tags vary from 29M posts for the most common to 1 for the least common. Q6 has a common tag (in top few hundred) half the time and a random, most often very infrequent, one the rest of the time. A declarative implementation must recognize the cardinality implications from the literal and plan accordingly. An imperative one would have to count. Missing this makes Q6 take about 40% of the time instead of 4.1% when adapting.</p> +</li> +<li> +<p><em>Covering indices —</em> Being able to make multi-column indices that duplicate some columns from the table often saves an entire table lookup. For example, an index onpost by author can also contain the post&rsquo;s creation date.</p> +</li> +<li> +<p><em>Multi-hop graph traversal —</em> Most queries access a two-hop environment starting at a person. Two queries look for shortest paths of unbounded length. For the two-hop case, it makes almost no difference whether this is done as a union or a special graph traversal operator. For shortest paths, this simply must be built into the engine; doing this client-side incurs prohibitive overheads. A bidirectional shortest path operation is a requirement for the benchmark.</p> +</li> +<li> +<p><em>Top <em>K</em> —</em> Most queries returning posts order results by descending date. Once there are at least <em>k</em> results, anything older than the __k__th can be dropped, adding a dateselection as early as possible in the query. 
This interacts with vectored execution, so that starting with a short vector size more rapidly produces an initial top <em>k</em>.</p> +</li> +<li> +<p><em>Late projection —</em> Many queries access several columns and touch millions of rows but only return a few. The columns that are not used in sorting or selection can be retrieved only for the rows that are actually returned. This is especially useful with a column store, as this removes many large columns (e.g., text of a post) from the working set.</p> +</li> +<li> +<p><em>Materialization —</em> Q14 accesses an expensive-to-compute edge weight, the number of post-reply pairs between two people. Keeping this precomputed drops Q14 from the top place. Other materialization would be possible, for example Q2 (top 20 posts by friends), but since Q2 is just 1% of the load, there is no need. One could of course argue that this should be 20x more frequent, in which case there could be a point to this.</p> +</li> +<li> +<p><em>Concurrency control —</em> Read-write contention is rare, as updates are randomly spread over the database. However, some pages get read very frequently, e.g., some middle level index pages in the post table. Keeping a count of reading threads requires a mutex, and there is significant contention on this. Since the hot set can be one page, adding more mutexes does not always help. However, hash partitioning the index into many independent trees (as in the case of a cluster) helps for this. There is also contention on a mutex for assigning threads to client requests, as there are large numbers of short operations.</p> +</li> +</ul> +<p>In subsequent posts, we will look at specific queries, what they in fact do, and what their theoretical performance limits would be. In this way we will have a precise understanding of which way SNB can steer the graph DB community.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + SNB and Graphs Related Presentations at GRADES '15 + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + Fri, 29 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + <p>Next 31st of May the GRADES workshop will take place in Melbourne within the ACM/SIGMOD presentation. GRADES started as an initiative of the Linked Data Benchmark Council in the SIGMOD/PODS 2013 held in New York.</p> +<p>Among the papers published in this edition we have &ldquo;Graphalytics: A Big Data Benchmark for Graph-Processing Platforms&rdquo;, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can be found in <a href="https://github.com/ldbc">https://github.com/ldbc</a>) as the base to execute the algorithms used for the benchmark, among which we have BFS, community detection and connected components. We also have &ldquo;Microblogging Queries on Graph Databases: an Introspection&rdquo; which benchmarks two of the most significant Graph Databases in the market, i.e. 
Neo4j and Sparksee using microblogging queries on top of twitter data. We can finally mention &ldquo;Frappé: Querying the Linux Kernel Dependency Graph&rdquo; which presents a framework for querying and visualising the dependencies of large C/C++ software systems.</p> +<p><a href="http://event.cwi.nl/grades2015/program.shtml">Check the complete agenda.</a></p> +<p>Meet you in Melbourne!</p> + + + + + SNB Interactive Part 2: Modeling Choices + https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/ + Tue, 26 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/ + <p><a href="https://ldbcouncil.org/benchmarks/snb">​SNB Interactive</a> is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.</p> +<p>In the case of <a href="http://dbpedia.org/resource/Virtuoso_Universal_Server">Virtuoso</a>, we have played with <a href="http://dbpedia.org/resource/SQL">SQL</a> and <a href="http://dbpedia.org/resource/SPARQL">SPARQL</a> implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that this allows to materialize multi-part indices and data orderings that make sense for the application. In other words, there is transparency into physical design. An RDF application may also have physical design by means ofstructure-aware storage but this is more complex and here we are just concerned with speed and having things work precisely as we intend.</p> +<h3 id="schema-design">Schema Design</h3> +<p>SNB has a regular schema described by a <a href="https://en.wikipedia.org/wiki/Unified_Modeling_Language">UML</a> diagram. This has a number of relationships of which some have attributes. There are no heterogenous sets, e.g. no need for run-time typed attributes or graph edges with the same label but heterogeneous end points. Translation into SQL or RDF is straightforward. Edges with attributes, e.g. the knows relation between people would end up represented as a subject with the end points and the date since as properties. The relational implementation has a two-part primary key and the date since as a dependent column. A native property graph database would use an edge with an extra property for this, as such are typically supported.</p> +<p>The only table-level choice has to do with whether <code>posts</code> and <code>comments</code> are kept in the same or different data structures. The Virtuoso schema has a single table for both, with nullable columns for the properties that occur only in one. This makes the queries more concise. There are cases where only non-reply posts of a given author are accessed. This is supported by having two author foreign key columns each with its own index. There is a single nullable foreign key from the reply to the post/comment being replied to.</p> +<p>The workload has some frequent access paths that need to be supported by index. Some queries reward placing extra columns in indices. For example, a common pattern is accessing the most recent posts of an author or group of authors. 
There, having a composite key of <code>ps_creatorid</code>, <code>ps_creationdate</code>, <code>ps_postid</code> pays off since the top-k on <code>creationdate</code> can be pushed down into the index without needing a reference to the table.</p> +<p>The implementation is free to choose data types for attributes, specifically datetimes. The Virtuoso implementation adopts the practice of the <a href="http://dbpedia.org/resource/DEX_(Graph_database)">Sparksee</a> and <a href="http://dbpedia.org/resource/Neo4j">Neo4J</a> implementations and represents this as a count of milliseconds since the epoch. This is less confusing, faster to compare and more compact than a native datetime datatype that may or may not have timezones etc. Using a built-in datetime seems to be nearly always a bad idea. A dimension table or a number for a time dimension avoids the ambiguities of a calendar or at least makes these explicit.</p> +<p>The benchmark allows procedurally maintaining materializations of intermediate results for use by queries as long as these are maintained transaction by transaction. For example, each person could have the 20 newest posts by immediate contacts precomputed. This would reduce Q2 &ldquo;top of the wall&rdquo; to a single lookup. This does not, however, appear to be worthwhile. The Virtuoso implementation does do one such materialization for Q14: A connection weight is calculated for every pair of persons that know each other. This is related to the count of replies by one or the other to content generated by the other. If there does not exist a single reply in either direction, the weight is taken to be 0. This weight is precomputed after bulk load and subsequently maintained each time a reply is added. The table for this is the only row-wise structure in the schema and represents a half matrix of connected people, i.e. <code>person1</code>, <code>person2</code> -&gt; <code>weight</code>. <code>Person1</code> is by convention the one with the smaller <code>p_personid</code>. Note that comparing IDs in this way is useful but not normally supported by RDF systems. RDF would end up comparing URI strings, with disastrous performance implications, unless an implementation-specific trick were used.</p> +<p>In the next installment we will analyze an actual run.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference + https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/ + Mon, 25 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/ + <p>LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015. 
The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.</p> +<p>On the industry track, LDBC will be presenting the <em>Social Network Benchmark Interactive Workload</em> by Orri Erling (OpenLink Software), Alex Averbuch (Neo Technology), Josep Larriba-Pey (Sparsity Technologies), Hassan Chafi (Oracle Labs), Andrey Gubichev (TU Munich), Arnau Prat (Universitat Politècnica de Catalunya), Minh-Duc Pham (VU University Amsterdam) and Peter Boncz (CWI).</p> +<p>You can read more about the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark here</a> and collaborate if you&rsquo;re interested!</p> +<p>The other presentation will be at the GRADES workshop within the SIGMOD program regarding <em>Graphalytics: A Big Data Benchmark for Graph-Processing Platforms</em> by Mihai Capotă, Tim Hegeman, Alexandru Iosup (Delft University of Technology), Arnau Prat (Universitat Politècnica de Catalunya), Orri Erling (OpenLink Software) and Peter Boncz (CWI). We will provide more information about GRADES and this specific presentation in a following post, as GRADES is part of the events organized by LDBC.</p> +<p>Don&rsquo;t forget to check our presentations if you&rsquo;re attending SIGMOD!</p> + + + + + SNB Interactive Part 1: What Is SNB Interactive Really About? + https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/ + Thu, 14 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/ + <p>This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. This is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of same.</p> +<p>With two implementations of SNB Interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its performance characteristics are understood and even if these do not represent the maximum of the attainable, there are no glaring mistakes and the implementation represents a reasonable best effort by those who ought to know, namely the system vendors.</p> +<p>The essence of a benchmark is a set of trick questions or choke points, as LDBC calls them. A number of these were planned from the start. It is then the role of experience to tell whether addressing these is really the key to winning the race. Unforeseen ones will also surface.</p> +<p>So far, we see that SNB confronts the implementor with choices in the following areas:</p> +<ul> +<li>Data model: Relational, RDF, property graph?</li> +<li>Physical model, e.g. row-wise vs. column-wise storage</li> +<li>Materialized data ordering: Sorted projections, composite keys, replicating columns in auxiliary data structures</li> +<li>Maintaining precomputed, materialized intermediate results, e.g. use of materialized views, triggers</li> +<li>Query optimization: join order/type, interesting physical data orderings, late projection, top k, etc.</li> +<li>Parameters vs. 
literals: Sometimes different parameter values result in different optimal query plans</li> +<li>Predictable, uniform latency: The measurement rules stipulate the SUT must not fall behind the simulated workload</li> +<li>Durability - how to make data durable while maintaining steady throughput? Logging vs. checkpointing.</li> +</ul> +<p>In the process of making a benchmark implementation, one naturally encounters questions about the validity, reasonability and rationale of the benchmark definition itself. Additionally, even though the benchmark might not directly measure certain aspects of a system, making an implementation will take a system past its usual envelope and highlight some operational aspects.</p> +<ul> +<li>Data generation - Generating a mid-size dataset takes time, e.g. 8 hours for 300G. In a cloud situation, keeping the dataset in S3 or similar is necessary, re-generating every time is not an option.</li> +<li>Query mix - Are the relative frequencies of the operations reasonable? What bias does this introduce?</li> +<li>Uniformity of parameters: Due to non-uniform data distributions in the dataset, there is easily a 100x difference between a &lsquo;fast&rsquo; and &lsquo;slow&rsquo; case of a single query template. How long does one need to run to balance these fluctuations?</li> +<li>Working set: Experience shows that there is a large difference between almost warm and steady state of working set. This can be a factor of 1.5 in throughput.</li> +<li>Are the latency constraints reasonable? In the present case, a qualifying run must have under 5% of all query executions starting over 1 second late. Each execution is scheduled beforehand and done at the intended time. If the SUT does not keep up, it will have all available threads busy and must finish some work before accepting new work, so some queries will start late. Is this a good criterion for measuring consistency of response time? There are some obvious possibilities of abuse.</li> +<li>Is the benchmark easy to implement/run? Perfection is open-ended and optimization possibilities infinite, albeit with diminishing returns. Still, getting startyed should not be too hard. Since systems will be highly diverse, testing that these in fact do the same thing is important. The SNB validation suite is good for this and given publicly available reference implementations, the effort of getting started is not unreasonable.</li> +<li>Since a Qualifying run must meet latency constraints while going as fast as possible, setting the performance target involves trial and error. Does the tooling make this easy?</li> +<li>Is the durability rule reasonable? Right now, one is not required to do checkpoints but must report the time to roll forward from the last checkpoint or initial state. Incenting vendors to build faster recovery is certainly good, but we are not through with all the implications. 
What about redundant clusters?</li> +</ul> +<p>The following posts will look at the above in light of actual experience.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + Why Do We Need an LDBC SNB-Specific Workload Driver? + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + Tue, 21 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + <p>In a previous <a href="https://ldbcouncil.org/tags/driver">3-part blog series</a> we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn&rsquo;t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more traditional database benchmark workloads. Additionally, it will motivate why we chose to develop a new workload driver as part of this work, rather than using existing tooling that was developed in other database benchmarking efforts. To briefly recap, the task of the driver is to run a transactional database benchmark against large synthetic graph datasets - &ldquo;graph&rdquo; is the word that best captures the novelty and difficulty of this work.</p> +<p><strong>Workload Execution - Traditional vs Graph</strong></p> +<p>Transactional graph workloads differ from traditional relational workloads in several fundamental ways, one of them being the complex dependencies that exist between queries of a graph workload.</p> +<p>To understand what is meant by &ldquo;traditional relational workloads&rdquo;, take the classical TPC-C benchmark as an example. In TPC-C Remote Terminal Emulators (emulators) are used to issue update transactions in parallel, where the transactions issued by these emulators do not depend on one another. Note, &ldquo;dependency&rdquo; is used here in the context of scheduling, i.e., one query is dependent on another if it can not start until the other completes. For example, a New-Order transaction does not depend on other orders from this or other users. Naturally, the results of Stock-Level transactions depend on the items that were previously sold, but in TPC-C it is not an emulator&rsquo;s responsibility to enforce any such ordering. The scheduling strategy employed by TPC-C is tailored to the scenario where transactional updates do not depend on one another. In reality, one would expect to also have scheduling dependencies between transactions, e.g., checking the status of the order should only be done after the order is registered in the system. TPC-C, however, does not do this and instead only asks for the status of the last order <em>for a given user</em>. Furthermore, adding such dependencies to TPC-C would make scheduling only slightly more elaborate. 
Indeed, the Load Tester (LT) would need to make sure a New-Order transaction always precedes the read requests that check its status, but because users (and their orders) are partitioned across LTs, and orders belong to a particular user, this scheduling does not require inter-LT communication.</p> +<p>A significantly more difficult scheduling problem arises when we consider the SNB benchmark that models a real-world social network. Its domain includes users that form a social friendship graph and which leave posts/comments/likes on each others walls (forums). The update transactions are generated (exported as a log) by the data generator, with assigned timestamps, e.g. user 123 added post 456 to forum 789 at time T. Suppose we partition this workload by user, such that each driver gets all the updates (friendship requests, posts, comments and likes on other user&rsquo;s posts etc) initiated by a given user. Now, if the benchmark is to resemble a real-world social network, the update operations represent a highly connected (and dependent) network: a user should not create comments before she joins the network, a friendship request can not be sent to a non-existent user, a comment can only be added to a post that already exists, etc. Given a user partitioning scheme, most such dependencies would cross the boundaries between driver threads/processes, because the correct execution of update operations requires that the social network is in a particular state, and that state depends on the progress of other threads/processes.</p> +<p>Such scheduling dependencies in the SNB workload essentially replicate the underlying graph-like shape of its dataset. That is, every time a user comments on a friend&rsquo;s wall, for example, there is a dependency between two operations that is captured by an edge of the social graph. <em>Partitioning the workload among the LTs therefore becomes equivalent to graph partitioning, a known hard problem.</em></p> +<p><strong>Because it&rsquo;s a graph</strong></p> +<p>In short, unlike previous database benchmarking efforts, the SNB workload has necessitated a redefining of the state-of-the-art in workload execution. It is no longer sufficient to rely solely on workload partitioning to safely capture inter-query dependencies in complex database benchmark workloads. The graph-centric nature of SNB introduces new challenges, and novel mechanisms had to be developed to overcome these challenges. To the best of our knowledge, the LDBC SNB Interactive benchmark is the first benchmark that requires a non-trivial partitioning of the workload, among the benchmark drivers. In the context of workload execution, our contribution is therefore the principled design of a driver that executes dependent update operations in a performant and scalable way, across parallel/distributed LTs, while providing repeatable, vendor-independent execution of the benchmark.</p> + + + + + Event Driven Post Generation in Datagen + https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/ + Fri, 10 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/ + <p>As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain more in depth how this is actually implemented inside of the generator.</p> +<p>First of all, I start with a few basics of how Datagen works internally. 
In Datagen, once the person graph has been created (persons and their relationships), the activity generation starts. Persons are divided into blocks of 10k, in the same way they are during the friendship edge generation process. Then, for each person of the block, three types of forums are created:</p> +<ul> +<li> +<p>The wall of the person</p> +</li> +<li> +<p>The albums of the person</p> +</li> +<li> +<p>The groups where the person is a moderator</p> +</li> +</ul> +<p>We will focus on group generation, but the same concepts apply to the other types of forums. Once a group is created, the members of the group are selected. These are selected from either the friends of the moderator, or random persons within the same block.</p> +<p>After assigning the members to the group, the post generation starts. We have two types of post generators, the uniform post generator and the event-based post generator. Each post generator is responsible for generating, given a forum, a set of posts for the forum, whose authors are taken from the set of members of the forum. The uniform post generator distributes the dates of the generated posts uniformly over the timeline (from the date of the membership until the end of the simulation time). On the other hand, the event-based post generator assigns dates to posts based on what we call “flashmob events”.</p> +<p>Flashmob events are generated at the beginning of the execution. Their number is predefined by a configuration parameter, which is set to 30 events per month of simulation, and the time of each event is distributed uniformly along the whole timeline. Also, each event has a volume level assigned (between 1 and 20) following a power law distribution, which determines how relevant or important the event is, and a tag representing the concept or topic of the event. Two different events can have the same tag. For example, one of the flashmob events created for SF1 is one related to the &ldquo;Enrique Iglesias&rdquo; tag, whose level is 11 and which occurs on the 29th of May 2012 at 09:33:47.</p> +<p>Once the event-based post generation starts for a given group, a subset of the generated flashmob events is extracted. These events must be correlated with the tag/topic of the group, and the set of selected events is restricted by the creation date of the group (in a group one cannot talk about an event prior to the creation of the group). Given this subset of events and their volume level, a cumulative probability distribution (using the events sorted by event date and their level) is computed, which is later used to determine to which event a given post is associated. Therefore, those events with a larger level will have a larger probability of receiving posts, making their volume larger. Then, post generation starts, which can be summarized as follows:</p> +<ul> +<li> +<p>Determine the number of posts to generate</p> +</li> +<li> +<p>Select a random member of the group that will generate the post</p> +</li> +<li> +<p>Determine the event the post will be related to, given the aforementioned cumulative distribution (see the sketch below)</p> +</li> +<li> +<p>Assign the date of the post based on the event date</p> +</li> +</ul> +<p>In order to assign the date to the post, based on the date of the event the post is assigned to, we follow a probability density which has been extracted from <a href="#references">[1]</a>.</p>
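+<p>To make the event selection step above more concrete, here is a minimal Python sketch of how a post could be attached to a flashmob event through the level-weighted cumulative distribution just described. The names and the data layout (events as date-sorted pairs of date and volume level, already filtered by tag correlation and group creation date) are illustrative assumptions rather than the actual Datagen code; the final date assignment around the chosen event follows the probability density described next, which is not shown here.</p>
+<pre tabindex="0"><code>import bisect
+import random
+
+def build_event_cdf(events):
+    # events: list of (event_date, level) pairs, sorted by event date and
+    # already restricted to events correlated with the group's tag and
+    # not earlier than the group's creation date.
+    total = float(sum(level for _, level in events))
+    cdf, acc = [], 0.0
+    for _, level in events:
+        acc += level / total
+        cdf.append(acc)
+    return cdf
+
+def pick_event(events, cdf):
+    # Draw an event with probability proportional to its volume level,
+    # so that higher-level events attract more posts.
+    i = bisect.bisect_left(cdf, random.random())
+    return events[min(i, len(events) - 1)]
+</code></pre>
+<p>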
The shape of the probability density consists of a combination of an exponential function in the 8 hour interval around the peak, while the volume outside this interval follows a logarithmic function. The following figure shows the actual shape of the volume, centered at the date of the event.</p> +<p><img src="index.png" alt=""></p> +<p>Following the example of &ldquo;Enrique Iglesias&rdquo;, the following figure shows the activity volume of posts around the event as generated by Datagen.</p> +<p><img src="index2.png" alt=""></p> +<p>In this blog entry we have seen how datagen creates event driven user activity. This allows us to reproduce the heterogenous post creation density found in a real social network, where post creation is driven by real world events.</p> +<h4 id="references">References</h4> +<p>[1] Jure Leskovec, Lars Backstrom, Jon M. Kleinberg: Meme-tracking and the dynamics of the news cycle. KDD 2009: 497-506</p> + + + + + Sixth TUC Meeting + https://ldbcouncil.org/event/sixth-tuc-meeting/ + Thu, 19 Mar 2015 13:53:33 -0400 + + https://ldbcouncil.org/event/sixth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce its Sixth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at Universitat Politècnica de Catalunya, Barcelona on <strong>Thursday and Friday March 19/20, 2015.</strong></p> +<p>The LDBC FP7 EC funded project is reaching its finalisation, and this will be the last event sponsored directly by the project. However, tasks within LDBC will continue based on the LDBC independent organisation. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the first benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the whole new LDBC organisation officials.</li> +<li>Pre-event with the 3rd Graph-TA workshop organised on March 18th at the same premises, with a lot of interaction and interesting research presentations.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>.</p> +<h3 id="agenda">Agenda</h3> +<p><strong>Thursday 19th March</strong></p> +<p>11:00 - 11:30 Registration, coffee break and welcome (Josep Larriba Pey)</p> +<p>11:30 - 12:00 LDBC introduction and status update (Peter Boncz) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981131.pdf">slides</a></p> +<p>12:00 - 13:30 Technology and benchmarking (chair: Peter Boncz)</p> +<p>12:00 Venelin Kotsev (Ontotext). Semantic Publishing Benchmark v2.0. – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981137.pdf">slides</a></p> +<p>12:30 Nina Saveta (FORTH). SPIMBENCH: A Scalable, Schema-Aware, Instance Matching Benchmark for the Semantic Publishing Domain</p> +<p>12:50 Tomer Sagi (HP). 
Titan DB on LDBC SNB Interactive</p> +<p>13:10 Claudio Martella (VUA): Giraph and Lighthouse</p> +<p>13:30 - 14:30 Lunch break</p> +<p>14:30 - 16:00 Applications and use of Graph Technologies (chair: Hassan Chafi)</p> +<p>14:30 Jerven Bolleman (Swiss Institute of Bioinformatics): 20 billion triples in production <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981132.pdf">slides</a></p> +<p>14:50 Mark Wilkinson (Universidad Politécnica de Madrid): Design principles for Linked-Data-native Semantic Web Services <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981133.pdf">slides</a></p> +<p>15:10 Peter Haase (Metaphacts, Systap LLC): Querying the Wikidata Knowledge Graph <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981139.pdf">slides</a></p> +<p>15:30 Esteban Sota (GNOSS): Human Interaction with Faceted Searching Systems for big or complex graphs</p> +<p>18:30 - 20:00 Cultural visit Barcelona city center. Meet at Plaça Catalunya.</p> +<p>20:00 Social dinner at <a href="http://www.bastaix.com">Bastaix Restaurant</a>.</p> +<p><strong>Friday 20th March</strong></p> +<p>9:30 - 11:00 Technology and Benchmarking (chair: Josep L. Larriba-Pey)</p> +<p>9:30 Yinglong Xia (IBM): Towards Temporal Graph Management and Analytics</p> +<p>9:50 Alexandru Iosup (TU Delft). Graphalytics: A big data benchmark for graph-processing platforms</p> +<p>10:10 John Snelson (MarkLogic): Introduction to MarkLogic</p> +<p>10:30 Arnau Prat (UPC-Sparsity Technologies) and Alex Averbuch (Neo): Social Network Benchmark, Interactive Workload</p> +<p>10:50 Moritz Kaufmann. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/moritz-kaufmann-ldbc-snb-benchmark-auditing-6th-ldbc-tuc.pdf">The auditing experience</a></p> +<p>11:15 - 11:45 Coffee break</p> +<p>11:45 - 12:45 Applications and use of Graph Technologies (chair: Atanas Kiryakov)</p> +<p>11:45 Boris Motik (Oxford University): Parallel and Incremental Materialisation of RDF/Datalog in RDFox</p> +<p>12:05 Andreas Both (Unister): E-Commerce and Graph-driven Applications: Experiences and Optimizations while moving to Linked Data</p> +<p>12:25 Smrati Gupta (CA Technologies). Modaclouds Decision Support System in multicloud environments</p> +<p>12:45 Peter Boncz. Conclusions for the LDBC project and future perspectives. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981138.pdf">slides</a></p> +<p>13:30 - 14:30 Lunch break</p> +<p>15:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>19th and 20th March 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held at &ldquo;Aula Master&rdquo; at A3 building located inside the &ldquo;Campus Nord UPC&rdquo; in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h5 id="maps-and-situation"><strong>Maps and situation</strong></h5> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<h5 id="finding-upc"><strong>Finding UPC</strong></h5> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<h5 id="finding-the-meeting-room"><strong>Finding the meeting room</strong></h5> +<h5 id="getting-there">Getting there</h5> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to<br> +the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €20 and trips to other destinations in the city cost approximately €25-30.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. 
You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<h5 id="the-locations-of-the-airport-and-the-city-centre"><strong>The locations of the airport and the city centre</strong></h5> + + + + + The LDBC Datagen Community Structure + https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/ + Sun, 15 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/ + <p>This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.</p> +<p>When generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other more qualitative characteristics such as the degree distribution and the clustering coefficient. Real graphs, and especially social networks, typically have highly skewed degree distributions with a long tail, a moderately large clustering coefficient and an appreciable community structure.</p> +<p>The first two characteristics are deliberately modeled in DATAGEN. DATAGEN generates persons with a degree distribution that matches that observed in Facebook, and thanks to the attribute correlated edge generation process, we obtain graphs with a moderately large clustering coefficient. But what about the community structure of graphs generated with DATAGEN? The answer can be found in the paper titled “How community-like is the structure of synthetically generated graphs”, which was published in GRADES 2014 <a href="#references">[1]</a>. Here we summarize the paper and its contributions and findings.</p> +<p>Existing synthetic graph generators such as Rmat <a href="#references">[2]</a> and Mag <a href="#references">[3]</a> are graph generators designed to produce graphs with long-tailed distributions and a large clustering coefficient, but they completely ignore the fact that real graphs are structured into communities. For this reason, Lancichinetti et al. proposed LFR <a href="#references">[4]</a>, a graph generator that not only produced graphs with realistic high-level characteristics, but also enforced an appreciable community structure. This generator has become the de facto standard for benchmarking community detection algorithms, as it not only outputs a graph but also the communities present in that graph, hence it can be used to test the quality of a community detection algorithm.</p> +<p>However, no one studied whether the community structure produced by LFR was in fact realistic compared to real graphs. Even though the communities in LFR exhibit interesting properties, such as the expected larger internal density than external, or a long-tailed distribution of community sizes, they lack the noise and inhomogeneities present in a real graph. And more importantly, how does the community structure of DATAGEN compare to that exhibited in LFR and real graphs? Is it more or less realistic? The authors of <a href="#references">[1]</a> set up an experiment where they analyzed the characteristics of the communities output by LFR, and the groups (groups of people interested in a given topic) output by DATAGEN, and compared them to a set of real graphs with metadata. 
These real graphs, which can be downloaded from the Snap project website, are graphs that have recently become very popular in the field of community detection, as they contain ground truth communities extracted from their metadata. The ground truth graphs used in this experiment are shown in the following table. For more details about how this ground truth is generated, please refer to <a href="#references">[4]</a>.</p> +<table> +<thead> +<tr> +<th></th> +<th><em>Nodes</em></th> +<th><em>Edges</em></th> +</tr> +</thead> +<tbody> +<tr> +<td><em>Amazon</em></td> +<td>334863</td> +<td>925872</td> +</tr> +<tr> +<td><em>Dblp</em></td> +<td>317080</td> +<td>1049866</td> +</tr> +<tr> +<td><em>Youtube</em></td> +<td>1134890</td> +<td>2987624</td> +</tr> +<tr> +<td><em>Livejournal</em></td> +<td>3997962</td> +<td>34681189</td> +</tr> +</tbody> +</table> +<p>The authors of <a href="#references">[1]</a> selected a set of statistical indicators to characterize the communities:</p> +<ul> +<li>The clustering coefficient</li> +<li>The triangle participation ratio (TPR), which is the ratio of nodes that close at least one triangle in the community.</li> +<li>The bridge ratio, which is the ratio of edges whose removal disconnects the community.</li> +<li>The diameter</li> +<li>The conductance</li> +<li>The size</li> +</ul> +<p>The authors start by analyzing each community of the ground truth graphs using the above statistical indicators and plotting the distributions of each of them. The following are the plots of the Livejournal graph. We summarize the findings of the authors regarding real graphs:</p> +<ul> +<li>Several indicators (Clustering Coefficient, TPR and Bridge ratio) exhibit a multimodal distribution, with two peaks at their extremes.</li> +<li>Many of the communities (44%) have a small clustering coefficient between 0 and 0.01. Out of them, 56% have just three vertices. On the other hand, 11% of the communities have a clustering coefficient between 0.99 and 1.0. In between, communities exhibit different values of clustering coefficients. This trend is also observed for TPR and Bridge ratio. This suggests that communities cannot be modeled using a single model.</li>
+<li>84% of the communities have a diameter smaller than five, suggesting that ground truth communities are small and compact.</li> +<li>Ground truth communities are not very isolated; they have a lot of connections pointing outside of the community.</li> +<li>Most of the communities are small (10 or fewer nodes).</li> +<li>In general, ground truth communities are small, with a low diameter, not isolated, and with different ranges of internal connectivity.</li> +</ul> +<table> +<thead> +<tr> +<th style="text-align:center"></th> +<th style="text-align:center"></th> +</tr> +</thead> +<tbody> +<tr> +<td style="text-align:center"><img src="index.png" alt=""></td> +<td style="text-align:center"><img src="index2.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Clustering Coefficient</td> +<td style="text-align:center">TPR</td> +</tr> +<tr> +<td style="text-align:center"><img src="index3.png" alt=""></td> +<td style="text-align:center"><img src="index4.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Bridge Ratio</td> +<td style="text-align:center">Diameter</td> +</tr> +<tr> +<td style="text-align:center"><img src="index5.png" alt=""></td> +<td style="text-align:center"><img src="index6.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Conductance</td> +<td style="text-align:center">Size</td> +</tr> +</tbody> +</table> +<p>The authors performed the same experiment, but this time for DATAGEN and LFR graphs. They generated a graph of 150k nodes, using their default parameters. In the case of LFR, they tested five different values of the mixing factor, which specifies the ratio of edges of the community pointing outside of the community. They ranged this value from 0 to 0.5. The following are the distributions for DATAGEN.</p> +<table> +<thead> +<tr> +<th style="text-align:center"></th> +<th style="text-align:center"></th> +</tr> +</thead> +<tbody> +<tr> +<td style="text-align:center"><img src="index8.png" alt=""></td> +<td style="text-align:center"><img src="index9.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Clustering Coefficient</td> +<td style="text-align:center">TPR</td> +</tr> +<tr> +<td style="text-align:center"><img src="index10.png" alt=""></td> +<td style="text-align:center"><img src="index11.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Bridge Ratio</td> +<td style="text-align:center">Diameter</td> +</tr> +<tr> +<td style="text-align:center"><img src="index11.png" alt=""></td> +<td style="text-align:center"><img src="index12.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Conductance</td> +<td style="text-align:center">Size</td> +</tr> +</tbody> +</table> +<p>The main conclusions that can be extracted from DATAGEN can be summarized as follows:</p> +<ul> +<li>DATAGEN is able to reproduce the multimodal distribution observed for clustering coefficient, TPR and bridge ratio.</li> +<li>The central part of the clustering coefficient is biased towards the left, in a similar way as observed for the Youtube and Livejournal graphs.</li> +<li>Communities of DATAGEN graphs are, as in real graphs, not isolated, but in this case their level of isolation is significantly larger.</li> +<li>The diameter is small like in the real graphs.</li> +<li>It is significant that communities in DATAGEN graphs are closer to those observed in Youtube and Livejournal, as these are social networks like the graphs produced by DATAGEN. 
We see that DATAGEN is able to reproduce many of their characteristics.</li> +</ul> +<p>Finally, the authors repeat the same experiment for LFR graphs. The following are the plots for the LFR graph with mixing ratio 0.3. From them, the authors extract the following conclusions:</p> +<ul> +<li>LFR graphs do not show the multimodal distribution observed in real graphs</li> +<li>Only the diameter shows a shape similar to that in the ground truth.</li> +</ul> +<table> +<thead> +<tr> +<th style="text-align:center"></th> +<th style="text-align:center"></th> +</tr> +</thead> +<tbody> +<tr> +<td style="text-align:center"><img src="index13.png" alt=""></td> +<td style="text-align:center"><img src="index14.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Clustering Coefficient</td> +<td style="text-align:center">TPR</td> +</tr> +<tr> +<td style="text-align:center"><img src="index15.png" alt=""></td> +<td style="text-align:center"><img src="index16.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Bridge Ratio</td> +<td style="text-align:center">Diameter</td> +</tr> +<tr> +<td style="text-align:center"><img src="index17.png" alt=""></td> +<td style="text-align:center"><img src="index18.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Conductance</td> +<td style="text-align:center">Size</td> +</tr> +</tbody> +</table> +<p>To better quantify how similar the distributions of the different graphs are, the authors also show the correlograms for each of the statistical indicators. These correlograms contain Spearman&rsquo;s correlation coefficient between each pair of graphs for a given statistical indicator. The bluer the color, the better the correlation. We see that DATAGEN distributions correlate very well with those observed in real graphs, especially, as we commented above, with Youtube and Livejournal. On the other hand, LFR only succeeds significantly in the case of the diameter.</p> +<table> +<thead> +<tr> +<th style="text-align:center"></th> +<th style="text-align:center"></th> +</tr> +</thead> +<tbody> +<tr> +<td style="text-align:center"><img src="index19.png" alt=""></td> +<td style="text-align:center"><img src="index20.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Clustering Coefficient</td> +<td style="text-align:center">TPR</td> +</tr> +<tr> +<td style="text-align:center"><img src="index21.png" alt=""></td> +<td style="text-align:center"><img src="index22.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Bridge Ratio</td> +<td style="text-align:center">Diameter</td> +</tr> +<tr> +<td style="text-align:center"><img src="index23.png" alt=""></td> +<td style="text-align:center"><img src="index24.png" alt=""></td> +</tr> +<tr> +<td style="text-align:center">Conductance</td> +<td style="text-align:center">Size</td> +</tr> +</tbody> +</table> +<p>We see that DATAGEN is able to reproduce a realistic community structure, compared to existing graph generators. This feature could potentially be exploited to define new benchmarks to measure the quality of novel community detection algorithms. Stay tuned for future blog posts about this topic!</p> +<h4 id="references">References</h4> +<p>[1] Arnau Prat-Pérez, <a href="http://dblp.uni-trier.de/pers/hd/d/Dom=iacute=nguez=Sal:David">David Domínguez-Sal</a>: How community-like is the structure of synthetically generated graphs? 
<a href="http://dblp.uni-trier.de/db/conf/sigmod/grades2014.html#PratD14">GRADES 2014</a></p> +<p>[2] Deepayan Chakrabarti, Yiping Zhan, and ChristosFaloutsos. R-mat: A recursive model for graph mining. SIAM 2014</p> +<p>[3] Myunghwan Kim and Jure Leskovec. Multiplicative attribute graph model of real-world networks. Internet Mathematics</p> +<p>[4] Andrea Lancichinetti, Santo Fortunato, and Filippo Radicchi. Benchmark graphs for testing community detection algorithms. Physical Review E 2008.</p> + + + + + Industry Relevance of the Semantic Publishing Benchmark + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + Tue, 03 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + <h3 id="publishing-and-media-businesses-are-going-through-transformation">Publishing and media businesses are going through transformation</h3> +<p>I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and wrestling my jetlag in front of Hilton. In the lobby inside the SemTech 2010 conference attendants were watching a game from the FIFA World Cup in South Africa. In the picture, the self-service newspaper stand is empty, except for one free paper. It was not long ago, in the year 2000, this stand was full. Back than the people in the Bay area were willing to pay for printed newspapers. But this is no longer true.</p> +<p>What’s driving this change in publishing and media?</p> +<ul> +<li> +<p>Widespread and instantaneous distribution of information over the Internet has turned news into somewhat of a &ldquo;commodity&rdquo; and few people are willing to pay for it</p> +</li> +<li> +<p>The wealth of free content on YouTube and similar services spoiled the comfort of many mainstream broadcasters;</p> +</li> +<li> +<p>Open access publishing has limited academic publishers to sell journals and books at prices that were considered fair ten years ago.</p> +</li> +</ul> +<p><em>Alongside other changes in the industry, publishers figured out that it is critical to add value through better authoring, promotion, discoverability, delivery and presentation of precious content.</em></p> +<h3 id="imagine-instant-news-in-context-imagine-personal-channels-imagine--triplestores">Imagine instant news in context, Imagine personal channels, Imagine &hellip; triplestores</h3> +<p>While plain news can be created repeatedly, premium content and services are not as easy to create. Think of an article that not only tells the new facts, but refers back to previous events and is complemented by an info-box of relevant facts. It allows one to interpret and comprehend news more effectively. This is the well-known journalistic aim to put news in context. It is also well-known that producing such news in &ldquo;near real time&rdquo; is difficult and expensive using legacy processes and content management technology.</p> +<p>Another example would be a news feed that delivers good coverage of information relevant to a narrow subject – for example a company, a story line or a region. Judging by the demand for intelligent press clipping services like <a href="http://new.dowjones.com/products/factiva/">Factiva</a>, such channels are in demand but are not straightforward to produce with today’s technology. 
Despite the common perception that automated recommendations for related content and personalized news are technology no-brainers, suggesting truly relevant content is far from trivial.</p> +<p>Finally, if we use an example in life sciences, the ability to quickly find scientific articles discussing asthma and x-rays, while searching for respiration disorders and radiation, requires a search service that is not easy to deliver.</p> +<p>Many publishers have been pressed to advance their business. This, in turn, had led to quest to innovate. And semantic technology can help publishers in two fundamental ways:</p> +<ol> +<li>Generation of rich and &ldquo;meaningful&rdquo; (trying not to use &ldquo;semantic&rdquo; :-) metadata descriptions; 1. Dynamic retrieval of content, based on this rich metadata, enabling better delivery.</li> +</ol> +<p>In this post I write about &ldquo;semantic annotation&rdquo; and how it enables application scenarios like BBC’s Dynamic Semantic Publishing (DSP). I will also present the business case behind DSP. The final part of the post is about triplestores – semantic graph database engines, used in DSP. To be more concrete I write about the Semantic Publishing Benchmark (SPB), which evaluates the performance of triplestores in DSP scenarios.</p> +<h3 id="semantic-annotation-produces-rich-metadata-descriptions--the-fuel-for-semantic-publishing">Semantic Annotation produces Rich Metadata Descriptions – the fuel for semantic publishing</h3> +<p>The most popular meaning of &ldquo;semantic annotation&rdquo; is the process of enrichment of text with links to (descriptions of) concepts and entities mentioned in the text. This usually means tagging either the entire document or specific parts of it with identifiers of entities. These identifiers allow one to retrieve descriptions of the entities and relations to other entities – additional structured information that fuels better search and presentation.</p> +<p><img src="02_semantic_repository.png" alt=""></p> +<p>The concept of using <a href="http://infosys3.elfak.ni.ac.rs/nastava/attach/SemantickiWebKurs/sdarticle.pdf">text-mining for automatic semantic annotation</a> of text with respect to very large datasets, such as <a href="http://dbpedia.org/">DBPedia</a>, emerged in early 2000. In practical terms it means using such large datasets as a sort of gigantic gazetteer (name lookup tool) and the ability to disambiguate. Figuring out whether &ldquo;Paris&rdquo; in the text refers to the capital of France or to Paris, Texas, or to Paris Hilton is crucial in such context. Sometimes this is massively difficult – try to instruct a computer how to guess whether &ldquo;Hilton&rdquo; in the second sentence of this post refers to a hotel from the chain founded by her grandfather or that I had the chance to meet Paris Hilton in person on the street in San Francisco.</p> +<p>Today there are plenty of tools (such as the <a href="https://www.ontotext.com/semantic-solutions/media-publishing/">Ontotext Media and Publishing</a> platform and <a href="https://github.com/dbpedia-spotlight/dbpedia-spotlight/wiki">DBPedia Spotlight</a>) and services (such as Thomson Reuter’s <a href="http://www.opencalais.com/">OpenCalais</a> and Ontotext’s <a href="http://s4.ontotext.com">S4</a>) that offer automatic semantic annotation. Although text-mining cannot deliver 100% correct annotations, there are plenty of scenarios, where technology like this would revoluntionize a business. 
This is the case with the Dynamic Semantic Publishing scenario described below.</p> +<h3 id="the-bbcs-dynamic-semantic-publishing-dsp">The BBC’s Dynamic Semantic Publishing (DSP)</h3> +<p>Dynamic Semantic Publishing is a model for using semantic technology in media developed by a group led by John O’Donovan and Jem Rayfield at the BBC. The implementation of DSP behind BBC’s FIFA World Cup 2010 website was the first high-profile success story for usage of semantic technology in media. It is also the basis for the SPB benchmark – sufficient reasons to introduce this use case at length below.</p> +<p>BBC Future Media &amp; Technology department have transformed the BBC relational content management model and static publishing framework to a fully dynamic semantic publishing architecture. With minimal journalistic management, media assets are being enriched with links to concepts, semantically described in a triplestore. This novel semantic approach provides improved navigation, content re-use and re-purposing through automatic aggregation and rendering of links to relevant stories. At the end of the day DSP improves the user experience on BBC’s web site.</p> +<p><em>&ldquo;A high-performance dynamic semantic publishing framework facilitates the publication of automated metadata-driven web pages that are light-touch, requiring minimal journalistic management, as they automatically aggregate and render links to relevant stories&rdquo;.</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">Jem Rayfield, Senior Technical Architect</a>, BBC News and Knowledge</p> +<p>The Dynamic Semantic Publishing (DSP) architecture of the BBC curates and publishes content (e.g. articles or images) based on embedded Linked Data identifiers, ontologies and associated inference. It allows for journalists to determine levels of automation (&ldquo;edited by exception&rdquo;) and support semantic advertisement placement for audiences outside of the UK. The following quote explains the workflow when a new article gets into BBC’s content management system.</p> +<p><em>&ldquo;In addition to the manual selective tagging process, journalist-authored content is automatically analysed against the World Cup ontology. A <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#language">natural language and ontological determiner process</a> automatically extracts World Cup concepts embedded within a textual representation of a story. The concepts are moderated and, again, selectively applied before publication. Moderated, automated concept analysis improves the depth, breadth and quality of metadata publishing.</em></p> +<p><img src="03_bbc_sport.png" alt=""></p> +<p><em>Journalist-published metadata is captured and made persistent for querying using the resource description framework (<a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#RDF"><em>RDF</em></a>) metadata representation and triple store technology. <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#BigOWLIM">A RDF triplestore</a> and <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#SPARQL">SPARQL</a> approach was chosen over and above traditional relational database technologies due to the requirements for interpretation of metadata with respect to an ontological domain model. 
The high level goal is that the domain ontology allows for intelligent mapping of journalist assets to concepts and queries. The chosen triplestore provides reasoning following the forward-chaining model and thus implied inferred statements are automatically derived from the explicitly applied journalist metadata concepts. For example, if a journalist selects and applies the single concept &ldquo;Frank Lampard&rdquo;, then the framework infers and applies concepts such as &ldquo;England Squad&rdquo;, &ldquo;Group C&rdquo; and &ldquo;FIFA World Cup 2010&rdquo; &hellip;&rdquo;</em> &ndash; Jem Rayfield</p> +<p>One can consider each of the &ldquo;aggregation pages&rdquo; of BBC as a sort of feed or channel serving content related to a specific topic. If you take this perspective, with its World Cup 2010 website BBC was able to provide more than 700 thematic channels.</p> +<p><em>&ldquo;The World Cup site is a large site with over 700 aggregation pages (called index pages) designed to lead you on to the thousands of story pages and content</em></p> +<p><strong>…</strong><strong><em>we are not publishing pages, but publishing content</em></strong> <em>as assets which are then organized by the metadata dynamically into pages, but could be re-organized into any format we want much more easily than we could before.</em></p> +<p><img src="04_content_tagging.png" alt=""></p> +<p><em>… The index pages are published automatically. This process is what assures us of the highest quality output, but still <strong>save large amounts of time</strong> in managing the site and <strong>makes it possible for us to efficiently run so many pages</strong> for the World Cup.&rdquo;</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/the_world_cup_and_a_call_to_ac.html">John O&rsquo;Donovan, Chief Technical Architect, BBC Future Media &amp; Technology</a></p> +<p>To get a real feeling about the load of the triplestore behind BBC&rsquo;s World Cup web site, here are some statistics:</p> +<ul> +<li> +<p>800+ aggregation pages (Player, Team, Group, etc.), generated through SPARQL queries;</p> +</li> +<li> +<p>Average unique page requests/day: 2 million;</p> +</li> +<li> +<p>Average <strong>SPARQL queries/day: 1 million;</strong></p> +</li> +<li> +<p><strong>100s repository updates/inserts per minute</strong> with OWL 2 RL reasoning;</p> +</li> +<li> +<p>Multi data center that is fully resilient, clustered 6 node triplestore.</p> +</li> +</ul> +<h3 id="the-semantic-publishing-benchmark">The Semantic Publishing Benchmark</h3> +<p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the BBC Dynamic Semantic Publishing scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volumes of read requests (SPARQL queries collecting recent content and data to generate web pages on a specific subject, e.g. Frank Lampard).</p> +<p>SPB simulates a setup for media that deals with large volumes of streaming content, e.g. articles, pictures, videos. This content is being enriched with metadata that describes it through links to reference knowledge:</p> +<ul> +<li> +<p><em>Reference knowledge:</em> taxonomies and databases that include relevant concepts, entities and factual information (e.g. 
sport statistics);</p> +</li> +<li> +<p><em>Metadata</em> for each individual piece of content allows publishers to efficiently produce live streams of content relevant to specific subjects.</p> +</li> +</ul> +<p>In this scenario the triplestore holds both reference knowledge and metadata. The main interactions with the repository are of two types:</p> +<ul> +<li> +<p><em>Aggregation queries</em> retrieve content according to various criteria. There are two sets (mixes) of aggregation queries. The basic one includes interactive queries that involve retrieval of concrete pieces of content, as well as aggregation functions, geo-spatial and full-text search constraints. The analytical query mix includes analytical queries, faceted search and drill-down queries;</p> +</li> +<li> +<p><em>Updates</em>, adding new metadata or updating the reference knowledge. It is important that such updates should immediately impact the results of the aggregation queries. Imagine a fan checking the page for Frank Lampard right after he scored a goal – she will be very disappointed to see out of date statistics there.</p> +</li> +</ul> +<p>SPB v.1.0 directly reproduces the DSP setup at the BBC. The reference dataset consists of BBC Ontologies (Core, Sport, News), BBC datasets (list of F1 teams, MPs, etc.) and an excerpt from <a href="http://www.geonames.org/">Geonames</a> for the UK. The benchmark is packed with metadata generator that allows one to set up experiments at different scales. The metadata generator produces 19 statements per Creative Work (BBC’s slang for all sorts of media assets). The standard scale factor is 50 million statements.</p> +<p>A more technical introduction to SPB can be found in this <a href="https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark">post</a>. Results from experiments with SPB on different hardware configurations, including AWS instances, are available in this <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">post</a>. An interesting discovery is that given the current state of the technology (particularly the GraphDB v.6.1 engine) and today’s cloud infrastructure, the load of BBC’s World Cup 2010 website can be handled at AWS by a cluster that costs only $81/day.</p> +<p>Despite the fact that SPB v.1.0 follows closely the usage scenario for triplestores in BBC’s DSP incarnations, it is relevant to a wide range of media and publishing scenarios, where large volumes of &ldquo;fast flowing&rdquo; content need to be &ldquo;dispatched&rdquo; to serve various information needs of a huge number of consumers. The main challenges can be summarized as follows:</p> +<ul> +<li> +<p>The Triplestore is used as operational database serving a massive number of read queries (hundreds of queries per second) in parallel with tens of update transactions per second. Transactions need to be handled instantly and in a reliable and consistent manner;</p> +</li> +<li> +<p>Reasoning is needed to map content descriptions to queries in a flexible manner;</p> +</li> +<li> +<p>There are specific requirements, such as efficient handling of full-text search, geo-spatial and temporal constraints.</p> +</li> +</ul> +<h3 id="spb-v20--steeper-for-the-engines-closer-to-the-publishers">SPB v.2.0 – steeper for the engines, closer to the publishers</h3> +<p>We are in the final testing of the new version 2.0 of SPB. 
The benchmark has evolved to allow for retrieval of semantically relevant content in a more advanced manner and at the same time to demonstrate how triplestores can offer simplified and more efficient querying.</p> +<p>The major changes in SPB v.2.0 can be summarized as follows:</p> +<ul> +<li> +<p>Much bigger reference dataset: from 170 thousand to 22 million statements. Now it includes GeoNames data about all of Europe (around 7 million statements) and DBPedia data about companies, people and events (14 million statements). This way we can simulate media archives described against datasets with good global coverage for specific types of objects. Such large reference sets also provide a better testing ground for experiments with very large content archives – think of 50 million documents (1 billion statements) or more;</p> +</li> +<li> +<p>Better interconnected reference data: more than 5 million links between entities, including 500,000 owl:sameAs links between DBPedia and Geonames descriptions. The latter evaluates the capabilities of the engine to deal with data coming from multiple sources, which use different identifiers for one and the same entity;</p> +</li> +<li> +<p>Retrieval of relevant content through links in the reference data, including inferred ones. To this end it is important than SPB v.2.0 involves much more comprehensive inference, particularly with respect to transitive closure of parent-company and geographic nesting chains.</p> +</li> +</ul> + + + + + OWL-Empowered SPARQL Query Optimization + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + Wed, 18 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + <p>The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution plans for a given query.</p> +<p>In this post, we propose a different approach to query optimization, which is meant to complement (rather than replace) the standard optimization methodologies for SPARQL queries. Our approach is based on the use of schema information, encoded using OWL constructs, which often accompany Linked Data.</p> +<p>OWL adopts the Open World Assumption and hence OWL axioms are perceived primarily to infer new knowledge. Nevertheless, ontology designers consider OWL as an expressive schema language used to express constraints for validating the datasets, hence following the Closed World Assumption when interpreting OWL ontologies. Such constraints include disjointness/equivalence of classes/properties, cardinality constraints, domain and range restrictions for properties and others.</p> +<p>This richness of information carried over by OWL axioms can be the basis for the development of schema-aware techniques that will allow significant improvements in the performance of existing RDF query engines when used in tandem with data statistics or even other heuristics based on patterns found in SPARQL queries. 
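As a simple example, a cardinality constraint at the schema level can provide a hint on the proper join ordering, even if data statistics are missing or incomplete.</p>
+<p>To make this concrete, here is a small, purely illustrative sketch (the property <code>&lt;hasISBN&gt;</code> and the query do not come from any benchmark ontology). If the schema declares <code>&lt;hasISBN&gt;</code> to be an <code>owl:InverseFunctionalProperty</code>, a given ISBN value identifies at most one subject, so the optimizer knows that the first triple pattern below binds at most one <code>?book</code> and can safely evaluate it before the unbounded patterns, even without any statistics:</p>
+<pre tabindex="0"><code># Illustrative sketch only; assumes the schema contains:
+#   &lt;hasISBN&gt; rdf:type owl:InverseFunctionalProperty .
+# The constant ISBN then matches at most one ?book, making the first
+# pattern the most selective starting point for the join.
+SELECT ?reviewer
+WHERE { ?book &lt;hasISBN&gt; "978-3-16-148410-0" .
+        ?review &lt;about&gt; ?book .
+        ?review &lt;author&gt; ?reviewer }
+</code></pre>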
+<p>The aim of this post is to show that the richness of information carried over by OWL axioms under the Closed World Assumption can be the basis for the development of schema-aware optimization techniques that will allow considerable improvement for query processing. To attain this objective, we discuss a small set of interesting cases of OWL axioms; a full list can be found <a href="LDBC_D4.4.2_final.pdf">here</a>.</p>
+<h3 id="schema-based-optimization-techniques">Schema-Based Optimization Techniques</h3>
+<p>Here we provide some examples of queries, which, when combined with specific schema constraints expressed in OWL, can help the optimizer in formulating the (near to) optimal query plans.</p>
+<p>A simple first case is the case of constraint violation. Consider the query below, which returns all instances of class <code>&lt;A&gt;</code> which are fillers of a specific property <code>&lt;P&gt;</code>. If the underlying schema contains the information that the range of <code>&lt;P&gt;</code> is class <code>&lt;B&gt;</code>, and that class <code>&lt;B&gt;</code> is disjoint from class <code>&lt;A&gt;</code>, then this query should return the empty result, with no further evaluation (assuming that the constraints associated with the schema are satisfied by the data). An optimizer that takes into account schema information should return an empty result in constant time instead of trying to optimize or evaluate the large star join.</p>
+<pre tabindex="0"><code>SELECT ?v
+WHERE { ?v rdf : type &lt;A&gt; .
+ ?u &lt;P&gt; ?v . ?u &lt;P&gt; ?v1 .
+ ?u &lt;P1 &gt; ?v2 . ?u &lt;P2 &gt; ?v3 .
+ ?u &lt;P3 &gt; ?v4 . ?u &lt;P4 &gt; ?v5}
+</code></pre><p>Schema-aware optimizers could also prune the search space by eliminating results that are known a priori not to be in the answer set of a query. The query above is an extreme such example (where all potential results are pruned), but other cases are possible, such as the case of the query below, where all subclasses of class <code>&lt;A1&gt;</code> can immediately be identified as not being in the answer set.</p>
+<pre tabindex="0"><code>SELECT ?c
+WHERE { ?x rdf: type ?c . ?x &lt;P&gt; ?y .
+ FILTER NOT EXISTS { ?x rdf: type &lt;A1 &gt; }}
+</code></pre><p>Another category of schema-empowered optimizations has to do with improved selectivity estimation. In this respect, knowledge about the cardinality (minimum cardinality, maximum cardinality, exact cardinality, functionality) of a property can be exploited to formulate better query plans, even if data statistics are incomplete, missing or erroneous.</p>
+<p>Similarly, taking into account class hierarchies, or the definition of classes/properties via set theoretic constructs (union, intersection) at the schema level, can provide valuable information on the selectivity of certain triple patterns, thus facilitating the process of query optimization. Similar effects can be achieved using information about properties (functionality, transitivity, symmetry etc).</p>
+<p>As an example of these patterns, consider the query below, where class <code>&lt;C&gt;</code> is defined as the intersection of classes <code>&lt;C1&gt;</code>,<code> &lt;C2&gt;</code>. 
Thus, the triple pattern <code>(?x rdf:type &lt;C&gt;)</code> is more selective than <code>(?y rdf:type &lt;C1&gt;)</code> and <code>(?z rdf:type &lt;C2&gt;)</code> and this should be immediately recognizable by the optimizer, without having to resort to cost estimations. This example shows also how unnecessary triple patterns can be pruned from a query to reduce the number of necessary joins. Figure 1 illustrates the query plan obtained when the OWL intersectionOf construct is used.</p> +<pre tabindex="0"><code>SELECT ?x +WHERE { ?x rdf: type &lt;C&gt; . ?x &lt;P1 &gt; ?y . + ?y rdf : type &lt;C1 &gt; . ?y &lt;P2 &gt; ?z . ?z rdf : type &lt;C2 &gt; } +</code></pre><p><img src="owl_constraints.png" alt="image"></p> +<p>Schema information can also be used by the query optimizer to rewrite SPARQL queries to equivalent ones that are found in a form for which already known optimization techniques are easily applicable. For example, the query below could easily be transformed into a classical star-join query if we know (from the schema) that property <code>P4</code> is a symmetric property.</p> +<pre tabindex="0"><code>SELECT ?y ?y1 ?y2 ?y3 +WHERE { ?x &lt;P1 &gt; ?y . ?x &lt;P2 &gt; ?y1 . + ?x &lt;P3 &gt; ?y2 . ?y3 &lt;P4 &gt; ?x } +</code></pre><h3 id="conclusion">Conclusion</h3> +<p>In this post we argued that OWL-empowered optimization techniques can be beneficial for SPARQL query optimization when used in tandem with standard heuristics based on statistics. We provided some examples which showed the power of such optimizations in various cases, namely:</p> +<ul> +<li>Cases where the search space can be pruned due to the schema and the associated constraints; an extreme special sub-case is the identification of queries that violate schema constraints and thus produce no results.</li> +<li>Cases where the schema can help in the estimation of triple pattern selectivity, even if statistics are incomplete or missing.</li> +<li>Cases where the schema can identify redundant triple patterns that do not affect the result and can be safely eliminated from the query.</li> +<li>Cases where the schema can be used for rewriting a query in an equivalent form that would facilitate optimization using well-known optimization techniques.</li> +</ul> +<p>This list is by no means complete, as further cases can be identified by optimizers. Our aim in this post was not to provide a complete listing, but to demonstrate the potential of the idea in various directions.</p> + + + + + Person Activity Subgraph Features in LDBC DATAGEN + https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/ + Wed, 04 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/ + <p>When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically borrowed by the friendship subgraph and/or its structure. However, a social graph is more than a bunch of people being connected by friendship relations, but has a lot more of other things is worth to look at. With a quick view to commercial social networks like Facebook, Twitter or Google+, one can easily identify a lot of other elements such as text images or even video assets. More importantly, all these elements form other subgraphs within the social network! 
For example, the person activity subgraph is composed of posts and their replies in the different forums/groups in a social network, and has a tree-like structure connecting people through their message interactions.</p>
+<p>When looking at the LDBC Social Network Benchmark (SNB) and its interactive workload, one realizes that these other subgraphs, and especially the person activity subgraph, play a role even more important than that played by the friendship subgraph. Just two numbers illustrate this importance: 11 out of the 14 interactive workload queries require traversing parts of the person activity subgraph, and about 80% of all the data generated by DATAGEN belongs to this subgraph. As a consequence, a lot of effort has been devoted to making sure that the person activity subgraph is realistic enough to fulfill the needs of the benchmark. In the rest of this post, I will discuss some of the features implemented in DATAGEN that make the person activity subgraph interesting.</p>
+<h3 id="reaslistic-message-content">Realistic Message Content</h3>
+<p>Messages&rsquo; content in DATAGEN is not random, but contains snippets of text extracted from DBpedia about the tags the message has. Furthermore, not all messages are the same size, depending on whether they are posts or replies to them. For example, the size of a post is selected uniformly between a minimum and a maximum, but there is also a small probability that the content is very large (about 2000 characters). In the case of comments (replies to posts), there is a probability of 0.66 that they are very short (“ok”, “good”, “cool”, “thanks”, etc.). Moreover, in real forum conversations, it is typical to see conversations evolving from one topic to another. For this reason, there is a probability that the tags of comments replying to a post change during the flow of the conversation, moving from the post&rsquo;s tags to other related or randomly selected tags.</p>
+<h3 id="non-uniform-activity-levels">Non-uniform activity levels</h3>
+<p>In a real social network, not all the members show the same level of activity. Some people post messages more sporadically than others, whose activity is significantly higher. DATAGEN reproduces this phenomenon by correlating the activity level with the number of friends a person has. That is, the more friends a person has, the larger the number of posts they create, and also the larger the number of groups they belong to.</p>
+<h3 id="time-correlated-post-and-comment-generation">Time-correlated post and comment generation</h3>
+<p>In a real social network, user activity is driven by real world events such as sport events, elections or natural disasters, to cite just a few of them. For this reason, we observe spikes of activity around these events, where the amount of messages created increases significantly during a short period of time, reaching a maximum and then decreasing. DATAGEN emulates this behavior by generating a set of real world events about specific tags. Then, when the dates of posts and comments are generated, these events are taken into account in such a way that posts and comments are clustered around them. Also, not all the events are equally relevant, so some produce larger spikes than others. The shape of the activity is modeled following the model described in <a href="#references">[1]</a>. Furthermore, in order to represent the more normal and uniform person activity levels, we also generate uniformly distributed messages along the time line. 
The following figure shows the user activity volume along the time line.</p> +<p><img src="1.png" alt="image"></p> +<p>As we see, the timeline contains spikes of activity, instead of being uniform. Note that the generally increasing volume activity is due to the fact that more people is added to the social network as time advances.</p> +<p>In this post we have reviewed several interesting characteristics of the person activity generation process in DATAGEN. Stay tuned for future blog posts about this topic.</p> +<h4 id="references">References</h4> +<p>[1] Leskovec, J., Backstrom, L., &amp; Kleinberg, J. (2009, June). Meme-tracking and the dynamics of the news cycle. In <em>Proceedings of the 15th ACM SIGKDD international conference on Knowledge discovery and data mining</em> (pp. 497-506). ACM.</p> + + + + + SNB Driver - Part 2: Tracking Dependencies Between Queries + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + Fri, 23 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + <p>The <a href="https://ldbcouncil.org/post/snb-driver-part-1">SNB Driver part 1</a> post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we&rsquo;ll drill down deeper into the details of what it means to execute &ldquo;dependent queries&rdquo; during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in detail, it is just there to serve as a point of reference.</p> +<h3 id="definitions">Definitions</h3> +<ul> +<li> +<p><em>Simulation Time (ST)</em>: notion of time created by data generator. All time stamps in the generated data set are in simulation time</p> +</li> +<li> +<p><em>Real Time (RT)</em>: wall clock time</p> +</li> +<li> +<p><em>Time Compression Ratio</em>: function that maps simulation time to real time, e.g., an offset in combination with a compression ratio. It is a static value, set in driver configuration. Real Time Ratio is reported along with benchmark results, allowing others to recreate the same benchmark</p> +</li> +<li> +<p><em>Operation</em>: read and/or write</p> +</li> +<li> +<p><em>Dependencies</em>: operations in this set introduce dependencies in the workload. That is, for every operation in this set there exists at least one other operation (in Dependents) that can not be executed until this operation has been processed</p> +</li> +<li> +<p><em>Dependents</em>: operations in this set are dependent on at least one other operation (in Dependencies) in the workload</p> +</li> +<li> +<p><em>Due Time (DueT)</em>: point in simulation time at which the execution of an operation should be initiated.</p> +</li> +<li> +<p><em>Dependent Time (DepT)</em>: in addition to Due Time, every operation in Dependents also has a Dependent Time, which corresponds to the Due Time of the operation that it depends on. Dependent Time is always before Due Time. 
For operations with multiple dependencies, Dependent Time is the maximum Due Time of all the operations it depends on.</p>
+</li>
+<li>
+<p><em>Safe Time (SafeT)</em>: time duration.</p>
+<ul>
+<li>
+<p>when two operations have a necessary order in time (i.e., dependency) there is at least a SafeT interval between them</p>
+</li>
+<li>
+<p>SafeT is the minimum duration between the Dependency Time and Due Time of any operations in Dependents</p>
+</li>
+</ul>
+</li>
+<li>
+<p><em>Operation Stream</em>: sequence of operations ordered by Due Time (dependent operations must be separated by at least SafeT)</p>
+</li>
+<li>
+<p><em>Initiated Operations</em>: operations that have started executing but not yet finished</p>
+</li>
+<li>
+<p><em>Local Completion Time (per driver)</em>: point in simulation time behind which there are no uncompleted operations: Local Completion Time = min(min(Initiated Operations), max(Completed Operations))</p>
+</li>
+<li>
+<p><em>Global Completion Time (GCT)</em>: minimum completion time of all drivers. Once GCT has advanced to the Dependent Time of some operation that operation is safe to execute, i.e., the operations it depends on have all completed executing. Global Completion Time = min(Local Completion Time)</p>
+</li>
+<li>
+<p><em>Execution Window (Window)</em>: a timespan within which all operations can be safely executed</p>
+<ul>
+<li>
+<p>All operations satisfying window.startTime &lt;= operation.DueT &lt; window.endTime may be executed</p>
+</li>
+<li>
+<p>Within a window no restrictions on operation ordering or operation execution time are enforced; the driver has the freedom of choosing an arbitrary scheduling strategy inside the window</p>
+</li>
+<li>
+<p>To ensure that execution order respects dependencies between operations, window size is bounded by SafeT, such that: 0 &lt; window.duration &lt;= SafeT</p>
+</li>
+<li>
+<p>Window duration is fixed, per operation stream; this is to simplify scheduling and make benchmark runs repeatable</p>
+</li>
+<li>
+<p>Before any operations within a window can start executing it is required that: GCT &gt;= window.startTime - (SafeT - window.duration)</p>
+</li>
+<li>
+<p>All operations within a window must initiate and complete between window start and end times: window.startTime &lt;= operation.initiate &lt; window.endTime and window.startTime &lt;= operation.complete &lt; window.endTime</p>
+</li>
+</ul>
+</li>
+<li>
+<p><em>Dependency Mode</em>: defines dependencies, constraints on operation execution order</p>
+</li>
+<li>
+<p><em>Execution Mode</em>: defines how the runtime should execute operations of a given type</p>
+</li>
+</ul>
+<h3 id="tracking-dependencies">Tracking Dependencies</h3>
+<p>Now, the fun part: making sure dependent operations are executed in the correct order.</p>
+<p>Consider that every operation in a workload belongs to none, one, or both of the following sets: Dependencies and Dependents. As mentioned, the driver uses operation time stamps (Due Times) to ensure that dependencies are maintained. It keeps track of the latest point in time behind which every operation has completed. That is, every operation (i.e., dependency) with a Due Time lower than or equal to this time is guaranteed to have completed execution. 
It does this by maintaining a monotonically increasing variable called Global Completion Time (GCT).</p> +<p>Logically, every time the driver (via a database connector) begins execution of an operation from Dependencies that operation is added to Initiated Operations:</p> +<ul> +<li>the set of operations that have started executing but not yet finished.</li> +</ul> +<p>Then, upon completion, the operation is removed from Initiated Operations and added to Completed Operations:</p> +<ul> +<li>the set of operations that have started and finished executing.</li> +</ul> +<p>Using these sets, each driver process maintains its own view of GCT in the following way. Local progress is monitored and managed using a variable called Local Completion Time (LCT):</p> +<ul> +<li>the point in time behind which there are no uncompleted operations. No operation in Initiated Operations has a lower or equal Due Time and no operation in Completed Operations has an equal or higher Due Time.</li> +</ul> +<p>LCT is periodically sent to all other driver processes, which all then (locally) set their view of GCT to the minimum LCT of all driver processes. At this point the driver has two, of the necessary three (third covered shortly), pieces of information required for knowing when to execute an operation:</p> +<ul> +<li> +<p><em>Due Time</em>: point in time at which an operation should be executed, assuming all preconditions (e.g., dependencies) have been fulfilled</p> +</li> +<li> +<p><em>GCT</em>: every operation (from Dependencies) with a Due Time before this point in time has completed execution</p> +</li> +</ul> +<p>However, with only GCT to track dependencies the driver has no way of knowing when it is safe to execute any particular dependent operation. What GCT communicates is that all dependencies up to some point in time have completed, but whether or not the dependencies for any particular operation are within these completed operations is unknown. The driver would have to wait until GCT has passed the Due Time (because Dependency Time is always lower) of an operation before that operation could be safely executed, which would result in the undesirable outcome of every operation missing its Due Time. The required information is which particular operation in Dependencies does any operation in Dependents depend on. More specifically, the Due Time of this operation. This is referred to as Dependent Time:</p> +<ul> +<li>in addition to Due Time, every operation in Dependents also has (read: must have) a Dependent Time, which corresponds to the latest Due Time of all the operations it depends on. Once GCT has advanced beyond the Dependent Time of an operation that operation is safe to execute.</li> +</ul> +<p>Using these three mechanisms (Due Time, GCT, and Dependent Time) the driver is able to execute operations, while ensuring their dependencies are satisfied beforehand.</p> +<h3 id="scalable-execution-in-the-presence-of-dependencies">Scalable execution in the Presence of Dependencies</h3> +<p>The mechanisms introduced in part 1 guarantee that dependency constraints are not violated, but in doing so they unavoidably introduce overhead of communication/synchronization between driver threads/processes. To minimize the negative effects that synchronization has on scalability an additional Execution Mode was introduced (more about Execution Modes will be discussed shortly): Windowed Execution. 
Windowed Execution has two design goals:</p> +<p>a) make the generated load less &lsquo;bursty&rsquo;</p> +<p>b) allow the driver to &lsquo;scale&rsquo;, so when the driver is given more resources (CPUs, servers, etc.) it is able to generate more load.</p> +<p>In the context of Windowed Execution, operations are executed in groups (Windows), where operations are grouped according to their Due Time. Every Window has a Start Time, a Duration, and an End Time, and Windows contain only those operations that have a Due Time between Window.startTime and Window.endTime. Logically, all operations within a Window are executed at the same time, some time within the Window. No guaranty is made regarding exactly when, or in what order, an operation will execute within its Window.</p> +<p>The reasons this approach is correct are as follows:</p> +<ul> +<li> +<p>Operations belonging to the Dependencies set are never executed in this manner - the Due Times of Dependencies operations are never modified as this would affect how dependencies are tracked</p> +</li> +<li> +<p>The minimum duration between the Dependency Time and Due Time of any operation in Dependents is known (can be calculated by scanning through workload once), this duration is referred to as Safe Time (SafeT)</p> +</li> +<li> +<p>A window does not start executing until the dependencies of all its operations have been fulfilled. This is ensured by enforcing that window execution does not start until</p> +<p>GCT &gt;= window.startTime - (SafeT - window.duration) = window.endTime - SafeT; that is, the duration between GCT and the end of the window is no longer than SafeT</p> +</li> +</ul> +<p>The advantages of such an execution mode are as follows:</p> +<ul> +<li> +<p>As no guarantees are made regarding time or order of operation execution within a Window, GCT no longer needs to be read before the execution of every operation, only before the execution of every window</p> +</li> +<li> +<p>Then, as GCT is read less frequently, it follows that it does not need to be communicated between driver processes as frequently. There is no need or benefit to communicating GCT protocol message more frequently than approximately Window.duration, the side effect of which is reduced network traffic</p> +</li> +<li> +<p>Further, by making no guarantees regarding the order of execution the driver is free to reschedule operations (within Window bounds). The advantage being that operations can be rearranged in such a way as to reduce unwanted bursts of load during execution, which could otherwise occur while synchronizing GCT during demanding workloads. For example, a uniform scheduler may modify operation Due Times to be uniformly distributed across the Window timespan, to &lsquo;smoothen&rsquo; the load within a Window.</p> +</li> +</ul> +<p>As with any system, there are trade-offs to this design, particularly regarding Window.duration. The main trade-off is that between &lsquo;workload resolution&rsquo; and scalability. Increasing Window.duration reduces synchronization but also reduces the resolution at which the workload definition is followed. That is, the generated workload becomes less like the workload definition. However, as this is both bounded and configurable, it is not a major concern. This issue is illustrated in Figure 1, where the same stream of events is split into two different workloads based on different size of the Window. 
The workload with Window size 5 (on the right) has better resolution, especially for the &lsquo;bursty&rsquo; part of the event stream.</p> +<p><img src="window-scheduling.png" alt="image"><br> +Figure 1. Window scheduling</p> +<p>This design also trades a small amount of repeatability for scalability: as there are no timing or ordering guarantees within a window, two executions of the same window are not guaranteed to be equivalent - &lsquo;what happens in the window stays in the window&rsquo;. Despite sacrificing this repeatability, the results of operations do not change. No dependency-altering operations occur during the execution of a Window, therefore results for all queries should be equivalent between two executions of the same workload, there is no effect on the expected result for any given operation.</p> + + + + + SNB Driver - Part 3: Workload Execution Putting It All Together + https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/ + Tue, 20 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/ + <p>Up until now we have introduced the <a href="https://ldbcouncil.org/post/snb-driver-part-1">challenges faced when executing the LDBC SNB benchmark</a>, as well as explained <a href="https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries">how some of these are overcome</a>. With the foundations laid, we can now explain precisely how operations are executed.</p> +<p>Based on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these classifications the driver runtime then knows how each operation should be executed. These modes, as well as what they mean to the driver runtime, are described below.</p> +<h3 id="dependency-modes">Dependency Modes</h3> +<p>While executing a workload the driver treats operations differently, depending on their Dependency Mode. In the previous section operations were categorized by whether or not they are in the sets Dependencies and/or Dependents.</p> +<p>Another way of communicating the same categorization is by assigning a Dependency Mode to operations - every operation type generated by a workload definition must be assigned to exactly one Dependency Mode. Dependency modes define dependencies, constraints on operation execution order. The driver supports a number of different Dependency Modes: None, Read Only, Write Only, Read Write. 
During workload execution, operations of each type are treated as follows:</p>
+<p><strong>• None</strong></p>
+<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations to have completed executing)</p>
+<p>– Prior Execution: do nothing – After Execution: do nothing</p>
+<p><strong>• Read Only</strong></p>
+<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations to have completed executing)</p>
+<p>Dependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p>
+<p>– Prior Execution: wait for GCT &gt;= operation.DepT – After Execution: do nothing</p>
+<p><strong>• Write Only</strong></p>
+<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p>
+<p>Dependent On (NO): operation execution does not depend on GCT to have advanced sufficiently (i.e., correct execution of these operations does not depend on any other operations to have completed execution)</p>
+<p>– Prior Execution: add operation to Initiated Operations</p>
+<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p>
+<p><strong>• Read Write</strong></p>
+<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p>
+<p>Dependent On (YES): operation execution does depend on GCT to have advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p>
+<p>– Prior Execution: add operation to Initiated Operations, wait for GCT &gt;= operation.DepT</p>
+<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p>
+<h3 id="execution-modes">Execution Modes</h3>
+<p>Execution Modes relate to how operations are scheduled, when they are executed, and what their failure conditions are. Each operation type in a workload definition must be assigned to exactly one Execution Mode. The driver supports a number of different Execution Modes: Asynchronous, Synchronous, Partially Synchronous. It splits a single workload operation stream into multiple streams, zero or more streams per Execution Mode. 
During workload execution, operations from each of these streams are treated as follows.</p>
+<p><strong>• Asynchronous</strong>: operations are executed individually, when their Due Time arrives.</p>
+<p>Motivation: This is the default execution mode; it executes operations as true to the workload definition as possible.</p>
+<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler</p>
+<p>– Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p>
+<p>– Max Concurrent Executions: unbounded</p>
+<p>– Max Execution Time: unbounded</p>
+<p>– Failure: operation execution starts later than: operation.DueT + Tolerated Delay</p>
+<p><strong>• Synchronous</strong>: operations are executed individually, sequentially, in a blocking manner.</p>
+<p>Motivation: Some dependencies are difficult to capture efficiently with SafeT and GCT alone. For example, social applications often support conversations via posts and likes, where likes depend on the existence of posts. Furthermore, posts and likes also depend on the existence of the users that make them. However, users are created at a lower frequency than posts and likes, and it can be assumed they do not immediately start creating content. As such, a reasonably long SafeT can be used between the creation of a user and the first time that user creates posts or likes. Conversely, posts are often replied to and/or liked soon after their creation, meaning a short SafeT would be necessary to maintain the ordering dependency. Consequently, maintaining the dependencies related to conversations would require a short SafeT, and hence a small window. This results in windows containing fewer operations, leading to less potential for parallelism within windows, less freedom in scheduling, more synchronization, and greater likelihood of bursty behavior - all negative things.</p>
+<p>The alternative offered by Synchronous Execution is that, when practical, operations of certain types can be partitioned (e.g. posts and likes could be partitioned by the forum in which they appear), and partitions assigned to driver processes. Using the social application example from above, if all posts and likes were partitioned by forum the driver process that executes the operations from any partition could simply execute them sequentially. 
Then the only dependency to maintain would be on user operations, reducing synchronization dramatically, and parallelism could still be achieved as each partition would be executed independently, in parallel, by a different driver process.</p>
+<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler</p>
+<p>– Execute When time &gt;= operation.DueT and previousOperation.completed == true (and GCT &gt;= operation.DepT)</p>
+<p>– Max Concurrent Executions: 1</p>
+<p>– Max Execution Time: nextOperation.DueT - operation.DueT</p>
+<p>– Failure: operation execution starts later than: operation.DueT + Tolerated Delay, e.g., if previousOperation did not complete in time, forcing the current operation to wait for longer than the tolerated delay</p>
+<p><strong>• Partially Synchronous</strong> (Windowed Execution, described in Section 3.4 in more detail), groups of operations from the same time window are executed together</p>
+<p>– Re-scheduling Before Execution: Yes, as long as the following still holds:</p>
+<p>window.startTime &lt;= operation.DueT &lt; window.startTime + window.duration</p>
+<p>Operations within a window may be scheduled in any way, as long as they remain in the window from which they originated: their Due Times, and therefore ordering, may be modified</p>
+<p>– Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p>
+<p>– Max Concurrent Executions: number of operations within window</p>
+<p>– Max Execution Time: (window.startTime + window.duration) - operation.DueT</p>
+<p>– Failure: operation execution starts later than: window.startTime + window.duration; operation execution does not finish by: window.startTime + window.duration</p>
+<h3 id="tying-it-back-to-ldbc-snb">Tying it back to LDBC SNB</h3>
+<p>The driver was designed to execute the workload of LDBC SNB. As discussed, the main challenge of running queries in parallel on graph-shaped data stems from dependencies introduced by the graph structure. In other words, workload partitioning becomes as hard as graph partitioning.</p>
+<p>The LDBC SNB data can in fact be seen as a union of two parts:</p>
+<ol>
+<li>
+<p>Core Data: relatively small and dense friendship graph (not more than 10% of the data). Updates on this part are very hard to partition among driver threads, since the graph is essentially a single dense strongly connected component.</p>
+</li>
+<li>
+<p>User Activity Data: posts, replies, likes; this is by far the biggest part of the data. Updates on this part are easily partitioned as long as the dependencies with the &ldquo;core&rdquo; part are satisfied (i.e., users don&rsquo;t post things before the profiles are created, etc.).</p>
+</li>
+</ol>
+<p>In order to avoid friendship graph partitioning, the driver introduces the concept of SafeT, the minimal simulation time that should pass between two dependent events.</p>
+<p>This property is enforced by the data generator, i.e. the driver does not need to change or delay some operations in order to guarantee dependency safety. Respecting dependencies now means globally communicating the advances of the Global Completion Time, and making sure the operations do not start earlier than SafeT from their dependents.</p>
+<p>On the other hand, the driver exploits the fact that some of the dependencies in fact do not hinder partitioning: although replies to the post can only be sent after the post is created, these kinds of dependencies are satisfied if we partition the workload by forums. 
This way, all (update) operations on posts and comments from one forum are assigned to one driver thread. Since there is typically a lot of forums, each driver thread gets multiple ones. Updates from one forum are then run in Synchronous Execution Mode, and parallelism is achieved by running many distinct forums in parallel. By doing so, we can add posts and replies to forums at very high frequency without the need to communicate the GCT across driver instances (i.e. we efficiently create the so-called flash-mob effects in the posting/replying workload).</p> + + + + + Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide + https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/ + Tue, 13 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/ + <p>Until now we have discussed several aspects of the <a href="https://ldbcouncil.org/benchmarks/spb">Semantic Publishing Benchmark (SPB)</a> such as the <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">difference in performance between virtual and real servers configuration</a>, how to choose an <a href="https://ldbcouncil.org/post/making-semantic-publishing-execution-rules">appropriate query mix</a> for a benchmark run and our experience with using SPB in the development process of GraphDB for <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">finding performance issues</a>.</p> +<p>In this post we provide a step-by-step guide on how to run SPB using the <a href="http://rdf4j.org/">Sesame</a> RDF data store on a fresh install of <a href="http://releases.ubuntu.com/14.04.1/">Ubuntu Server 14.04.1</a>. The scenario is easy to adapt to other RDF triple stores which support the Sesame Framework used for querying and analyzing RDF data.</p> +<h3 id="prerequisites">Prerequisites</h3> +<p>We start with a fresh server installation, but before proceeding with setup of the Sesame Data Store and SPB benchmark we need the following pieces of software up and running:</p> +<ul> +<li>Git</li> +<li>Apache Ant 1.8 or higher</li> +<li>OpenJDK 6 or Oracle JDK 6 or higher</li> +<li>Apache Tomcat 7 or higher</li> +</ul> +<p>If you already have these components installed on your machine you can directly proceed to the next section: <em>Installing Sesame</em></p> +<p>Following are sample commands which can be used to install the required software components:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo apt-get install git +</span></span><span style="display:flex;"><span>sudo apt-get install ant +</span></span><span style="display:flex;"><span>sudo apt-get install default-jdk +</span></span><span style="display:flex;"><span>sudo apt-get install tomcat7 +</span></span></code></pre></div><p>Optionally Apache Tomcat Server can be downloaded as a zipped file and extracted in a location of choice.</p> +<p>After a successful installation of Apache Tomcat you should be able to get the default splash page <em>“It works”</em> when you open your web browser and enter the following address: http://&lt;your_ip_address&gt;:8080</p> +<h3 id="installing-sesame">Installing Sesame</h3> +<p>We will use current Sesame version 2.7.14. 
You can download it <a href="http://sourceforge.net/projects/sesame/files/Sesame%202/">here</a> or run following command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>wget <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;http://sourceforge.net/projects/sesame/files/Sesame%202/2.7.14/openrdf-sesame-2.7.14-sdk.tar.gz/download&#34;</span> <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> -O openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>Then extract the Sesame tarball:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>tar -xvzf openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>To deploy sesame you have to copy the two war files that are in <em>openrdf-sesame-2.7.14/war</em> to <em>/var/lib/tomcat7/webapps</em></p> +<p>From <em>openrdf-sesame-2.7.14/war</em> you can do it with command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>cp openrdf-*.war &lt;tomcat_install&gt;/webapps +</span></span></code></pre></div><p>Sesame applications write and store configuration files in a single directory and the tomcat server needs permissions for it.</p> +<p>By default the configuration directory is: <em>/usr/share/tomcat7/.aduna</em></p> +<p>Create the directory:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo mkdir /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Then change the ownership:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chown tomcat7 /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>And finally you should give the necessary permissions:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chmod o+rwx /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Now when you go to: http://&lt;your_ip_address&gt;:8080/openrdf-workbench/repositories</p> +<p>You should get a screen like this:</p> +<p><img src="01-Sesame-repo-list.png" alt="image"></p> +<h3 id="setup-spb">Setup SPB</h3> +<p>You can download the SPB code and find brief documentation on GitHub:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm">https://github.com/ldbc/ldbc_spb_bm</a></p> +<p>A detailed documentation is located here:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf">https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf</a></p> +<p>SPB offers many configuration options which control various features of the benchmark e.g.:</p> +<ul> +<li>query mixes</li> +<li>dataset size</li> +<li>loading 
datasets</li> +<li>number of agents</li> +<li>validating results</li> +<li>test conformance to OWL2-RL ruleset</li> +<li>update rate of agents</li> +</ul> +<p>Here we demonstrate how to generate a dataset and execute a simple test<br> +run with it.</p> +<p>First download the SPB source code from the repository:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>git clone https://github.com/ldbc/ldbc_spb_bm.git +</span></span></code></pre></div><p>Then in the ldbc_spb_bm directory build the project:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>ant build-basic-querymix +</span></span></code></pre></div><p>If you simply execute the command:</p> +<pre tabindex="0"><code>ant +</code></pre><p>you’ll get a list of all available build configurations for the SPB test driver, but for the purpose of this step-by-step guide, configuration shown above is sufficient.</p> +<p>Depending on generated dataset size a bigger java heap size may be required for the Sesame Store. You can change it by adding following arguments to Tomcat&rsquo;s startup files e.g. in <em>catalina.sh</em>:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>export JAVA_OPTS<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;-d64 -Xmx4G&#34;</span> +</span></span></code></pre></div><p>To run the Benchmark you need to create a repository in the Sesame Data Store, similar to the following screenshot:</p> +<p><img src="02-Sesame-create-repo.png" alt="image"></p> +<p>Then we need to point the benchmark test driver to the SPARQL endpoint of that repository. 
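This is done in the <em>ldbc_spb_bm/dist/test.properties</em> file.</p>
+<p>Before editing the file, it can be useful to check that the repository&rsquo;s endpoint (called <em>ldbc1</em> in the URLs below) actually answers SPARQL requests. A trivial query such as the following, sent to that endpoint, should return a single row with a (typically zero) triple count on a freshly created repository; an HTTP error at this point usually means the endpoint URL is wrong:</p>
+<pre tabindex="0"><code># Quick sanity check of the SPARQL endpoint before running the benchmark
+SELECT (COUNT(*) AS ?triples)
+WHERE { ?s ?p ?o }
+</code></pre>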
+<p>The default value of <em>datasetSize</em> in the properties is set to be 10M, but for the purpose of this guide we will decrease it to 1M.</p>
+<p>You need to change:</p>
+<pre tabindex="0"><code>datasetSize=1000000
+</code></pre><p>You also need to change the URLs of the SPARQL endpoint for the repository:</p>
+<pre tabindex="0"><code>endpointURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1
+endpointUpdateURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1/statements
+</code></pre><p>The first step, before measuring the performance of a triple store, is to load the reference-knowledge data, generate a 1M dataset, load it into the repository and finally generate query substitution parameters.</p>
+<p>These are the settings to do that; the following parameters will &lsquo;instruct&rsquo; the SPB test driver to perform all the actions described above:</p>
+<pre tabindex="0"><code>#Benchmark Operational Phases
+loadOntologies=true
+loadReferenceDatasets=true
+generateCreativeWorks=true
+loadCreativeWorks=true
+generateQuerySubstitutionParameters=true
+validateQueryResults=false
+warmUp=false
+runBenchmark=false
+runBenchmarkOnlineReplicationAndBackup=false
+checkConformance=false
+</code></pre><p>To run the benchmark, execute the following:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>java -jar semantic_publishing_benchmark-basic-standard.jar
+</span></span><span style="display:flex;"><span>test.properties
+</span></span></code></pre></div><p>When the initial run has finished, we should have a 1M dataset loaded into the repository and a set of files with query substitution parameters.</p>
+<p>Next we will measure the performance of the Sesame Data Store by changing some configuration properties:</p>
+<pre tabindex="0"><code>#Benchmark Configuration Parameters
+warmupPeriodSeconds=60
+benchmarkRunPeriodSeconds=300
+...
+#Benchmark Operational Phases
+loadOntologies=false
+loadReferenceDatasets=false
+generateCreativeWorks=false
+loadCreativeWorks=false
+generateQuerySubstitutionParameters=false
+validateQueryResults=false
+warmUp=true
+runBenchmark=true
+runBenchmarkOnlineReplicationAndBackup=false
+checkConformance=false
+</code></pre><p>After the benchmark test run has finished, result files are saved in the folder <em>dist/logs</em>.</p>
+<p>There you will find three types of results: the result summary of the benchmark run (<em>semantic_publishing_benchmark_results.log</em>), brief results and detailed results.</p>
+<p>In <em>semantic_publishing_benchmark_results.log</em> you will find the results distributed per second. 
They should be similar to the listing bellow:</p> +<p>Benchmark Results for the 300-th second</p> +<pre tabindex="0"><code>Seconds : 300 (completed query mixes : 0) + Editorial: + 2 agents + + 9 inserts (avg : 22484 ms, min : 115 ms, max : 81389 ms) + 0 updates (avg : 0 ms, min : 0 ms, max : 0 ms) + 0 deletes (avg : 0 ms, min : 0 ms, max : 0 ms) + + 9 operations (9 CW Inserts (0 errors), 0 CW Updates (1 errors), 0 CW Deletions (2 errors)) + 0.0300 average operations per second + + Aggregation: + 8 agents + + 2 Q1 queries (avg : 319 ms, min : 188 ms, max : 451 ms, 0 errors) + 3 Q2 queries (avg : 550 ms, min : 256 ms, max : 937 ms, 0 errors) + 1 Q3 queries (avg : 58380 ms, min : 58380 ms, max : 58380 ms, 0 errors) + 2 Q4 queries (avg : 65250 ms, min : 40024 ms, max : 90476 ms, 0 errors) + 1 Q5 queries (avg : 84220 ms, min : 84220 ms, max : 84220 ms, 0 errors) + 2 Q6 queries (avg : 34620 ms, min : 24499 ms, max : 44741 ms, 0 errors) + 3 Q7 queries (avg : 5892 ms, min : 4410 ms, max : 8528 ms, 0 errors) + 2 Q8 queries (avg : 3537 ms, min : 546 ms, max : 6528 ms, 0 errors) + 4 Q9 queries (avg : 148573 ms, min : 139078 ms, max : 169559 ms, 0 errors) +</code></pre><p>This step-by-step guide gave an introduction on how to setup and run the SPB on a Sesame Data Store. Further details can be found in the reference documentation listed above.</p> +<p>If you have any troubles running the benchmark, don&rsquo;t hesitate to comment or use our social media channels.</p> +<p>In a future post we will go through some of the parameters of SPB and check their performance implications.</p> + + + + + Semantic Publishing Instance Matching Benchmark + https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/ + Tue, 30 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/ + <p>The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.</p> +<p>The SPIMBench test cases provide a systematic way for testing the performance of instance matching systems in different settings. 
SPIMBench supports the types of test cases already adopted by existing instance matching benchmarks:</p> +<ul> +<li>value-based test cases based on applying value transformations (e.g., blank character addition and deletion, change of date format, abbreviations, synonyms) on triples relating to given input entity</li> +<li>structure-based test cases characterized by a structural transformation (e.g., different nesting levels for properties, property splitting, aggregation)</li> +</ul> +<p>The novelty of SPIMBench lies in the support for the following semantics-aware test cases defined on the basis of OWL constructs:</p> +<ul> +<li>instance (in)equality (owl:sameAs, owl:differentFrom)</li> +<li>class and property equivalence (owl:equivalentClass, owl:equivalentProperty)</li> +<li>class and property disjointness (owl:disjointWith, owl:AllDisjointClasses, owl:propertyDisjointWith, owl:AllDisjointProperties)</li> +<li>class and property hierarchies (rdfs:subClassOf, rdfs:subPropertyOf)</li> +<li>property constraints (owl:FunctionalProperty, owl:InverseFunctionalProperty)</li> +<li>complex class definitions (owl:unionOf, owl:intersectionOf)</li> +</ul> +<p>SPIMBench uses and extends the ontologies of LDBC&rsquo;s Semantic Publishing Benchmark (SPB) to tackle the more complex schema constructs expressed in terms of OWL. It also extends SPB&rsquo;s data generator to first generate a synthetic source dataset that does not contain any matches, and then to generate matches and non-matches to entities of the source dataset to address the supported transformations and OWL constructs. The data generation process allows the creation of arbitrary large datasets, thus supporting the evaluation of both the scalability and the matching quality of an instance matching system.</p> +<p>Value and structure-based test cases are implemented using the SWING framework <a href="#references">[1]</a> on data and object type properties respectively. These are produced by applying the appropriate transformation(s) on a source instance to obtain a target instance. Semantics-based test cases are produced in the same way as with the value and structure-based test cases with the difference that appropriate triples are constructed and added in the target dataset to consider the respective OWL constructs.</p> +<p>SPIMBench, in addition to the semantics-based test cases that differentiate it from existing instance matching benchmarks, also offers a weighted gold standard used to judge the quality of answers of instance matching systems. It contains generated matches (a pair consisting of an entity of the source dataset and an entity of the target dataset) the type of test case it represents, the property on which a transformation was applied (in the case of value-based and structure-based test cases), and a weight that quantifies how easy it is to detect this match automatically. SPIMBench adopts an information-theoretical approach by applying multi-relational learning to compute the weight of the pair of matched instances by measuring the information loss that results from applying transformations to the source data to generate the target data. 
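This detailed information, which is not provided by state-of-the-art benchmarks, allows users of SPIMBench (e.g., developers of IM systems) to more easily identify the reasons underlying the performance results obtained using SPIMBench and thereby supports the debugging of instance matching systems.</p>
+<p>To give a flavour of what such a test case and its gold standard entry look like, here is a deliberately simplified sketch (the IRIs, property names and weight are invented for illustration and do not reflect the actual SPIMBench serialization). The source and target creative works differ only by a value transformation on the date, and the gold standard records the expected match together with its weight:</p>
+<pre tabindex="0"><code># Illustrative sketch only - not the real SPIMBench output format.
+INSERT DATA {
+  # source instance
+  &lt;src/cw1&gt;  &lt;title&gt; "World Cup Final Report" ; &lt;dateCreated&gt; "2010-07-11" .
+  # target instance: a value transformation changes the date format
+  &lt;tgt/cw1&gt;  &lt;title&gt; "World Cup Final Report" ; &lt;dateCreated&gt; "11/07/2010" .
+  # gold standard: the pair is a match, annotated with a difficulty weight
+  &lt;gold/1&gt;   &lt;sourceInstance&gt; &lt;src/cw1&gt; ; &lt;targetInstance&gt; &lt;tgt/cw1&gt; ; &lt;weight&gt; 0.37 .
+}
+</code></pre>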
+<p>SPIMBench can be downloaded from <a href="https://github.com/jsaveta/SPIMBench">our repository</a> and a more thorough description thereof can be found on <a href="http://www.ics.forth.gr/isl/spimbench/">http://www.ics.forth.gr/isl/spimbench/</a>.</p>
+<h4 id="references">References</h4>
+<p>[1] A. Ferrara, S. Montanelli, J. Noessner, and H. Stuckenschmidt. Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p>
+
+
+
+
+        Further Developments in SNB BI Workload
+        https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/
+        Thu, 18 Dec 2014 00:00:00 +0000
+
+        https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/
+        <p>We are presently working on the SNB BI workload. Andrey Gubichev of TU Munchen and I are going through the queries and are playing with two SQL-based implementations, one on Virtuoso and the other on Hyper.</p>
+<p>As discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.</p>
+<p>There are obvious marketing applications for an SNB-like dataset. There are also security-related applications, ranging from fraud detection to intelligence analysis. The latter category is significant but harder to approach, as much of the detail of best practice is itself not in the open. In this post, I will outline some ideas discussed over time that might crystallize into a security-related section in the SNB BI workload. We invite comments from practitioners for making the business questions more relevant while protecting sensitive details.</p>
+<p>Let’s look at what scenarios would fit with the dataset. We have people, different kinds of connections between people, organizations, places and messages. Messages (posts/replies), people and organizations are geo-tagged. A finer level of geo-tagging, with actual GPS coordinates, travel itineraries, etc., all referring to real places, would make the data even more interesting. The geo dimension will be explored separately in a forthcoming post.</p>
+<p>One of the first things to appear when approaching the question is that the analysis of behavior patterns over time is not easily captured in purely declarative queries. For example, the temporal sequence of events and the quantity and quality of interactions between players lead to intractably long queries which are hard to understand and debug. Therefore, views and intermediate materializations become increasingly necessary.</p>
+<p>Another feature of the scene is that information is never complete. Even if logs are complete for any particular system, there are always possible interactions outside of the system. Therefore we tend to get match scores more than strictly Boolean conditions. Since everybody is related to everybody else via a relatively short path, the nature and strength of the relationship is key to interpreting its significance.</p>
+<p>Since a query consisting of scores and outer joins only is difficult to interpret and optimize, and since the information is seldom complete, some blanks may have to be filled in by guesses. 
The database must therefore contain metadata about this.</p>
+<p>An orthogonal aspect to security applications is the access control of the database itself. One might assume that if a data warehouse of analyzable information is put together, the analyst would have access to the entirety of it. This is however not necessarily the case, since the information itself and its provenance may fall under different compartments.</p>
+<p>So, let’s see how some of these aspects could be captured in the SNB context.</p>
+<p>Geography - We materialize a table of travel events, so that an unbroken sequence of posts from the same location (e.g. country) other than the residence of the poster forms a travel event. The posts may have a fine-grained position (IP, GPS coordinates of photos) that marks an itinerary. This is already beyond basic SQL, needing a procedure or window functions.</p>
+<p>The communication between people is implicit in reply threads and forum memberships. A reply is the closest that one comes to a person-to-person message in the dataset. Otherwise all content is posted to forums with more or fewer participants. Membership in a high-traffic forum with few participants would indicate a strong connection. Calculating these time-varying connection strengths is a lot of work and a lot of text in queries. Keeping things simple requires materializing a sparse “adjacency cube,” i.e. a relation of person1, person2, time bucket -&gt; connection strength. In the SNB case the connection strength may be derived from reciprocal replies, likes, being in the same forums, knowing each other etc. Selectivity is important, i.e. being in many small forums together counts for more than being in ones where everybody else also participates.</p>
+<p>The behavior of people in SNB is not identical from person to person, but for any given person it follows a preset pattern. Suppose a question like “which person with access to secrets has a marked change of online behavior?” The change would be starting or stopping communication with a given set of people, for example. Think of a spy who meets the future spymaster on a public occasion, has a series of exchanges, travels to an atypical destination, then stops all open contact with the spymaster or related individuals. Patterns like this do not occur in the data but can be introduced easily enough.</p>
+<p>In John Le Carre’s A Perfect Spy the main character is caught because it comes to light that his travel routes nearly always corresponded to his controller’s. This would make a query. This could be cast in marketing terms as a “(un)common shopping basket.”</p>
+<p>Analytics becomes prediction when one part of a pattern exists without the expected next stage. Thus the same query template can serve for detecting full or partial instances of a pattern, depending on how the scores are interpreted.</p>
+<p>From a database angle, these questions group on an item with internal structure. For the shopping basket this is a set. For the travel routes this is an ordered sequence of space/time points, with a match tolerance on the spatial and temporal elements. Another characteristic is that there is a baseline of expectations and the actual behavior. Both have structure, e.g. the occupation/location/interest/age of one’s social circle. These need to be condensed into a sort of metric space, and then changes and rates of change can be observed. Again, this calls for a multidimensional cube to be created as a summary, then algorithms to be applied to this. 
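</p>
+<p>To make the idea of the adjacency cube slightly more concrete, one slice of it could be materialized with SQL roughly as sketched below. This is only a hedged illustration: the table and column names (post, post_id, creator_id, creation_date, reply_of_post_id) are placeholders rather than any actual SNB schema, and counting one point of strength per reply is an arbitrary scoring choice.</p>
+<pre tabindex="0"><code>-- Sketch only: placeholder schema, reply counts as a crude proxy for connection strength.
-- One slice of the adjacency cube: (person1, person2, month) -&gt; strength.
CREATE TABLE adjacency_cube AS
SELECT p.creator_id                         AS person1,
       r.creator_id                         AS person2,
       EXTRACT(YEAR  FROM r.creation_date)  AS yr,
       EXTRACT(MONTH FROM r.creation_date)  AS mon,
       COUNT(*)                             AS strength
FROM post p
JOIN post r ON r.reply_of_post_id = p.post_id
WHERE p.creator_id &lt;&gt; r.creator_id
GROUP BY p.creator_id, r.creator_id,
         EXTRACT(YEAR FROM r.creation_date), EXTRACT(MONTH FROM r.creation_date);
</code></pre>
+<p>Likes, comembership in small forums and the other signals mentioned above would contribute further weighted terms to the same cube, with a selectivity weight discounting very large forums.</p>
+<p>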
The declarative BI query a la TPC-H does not easily capture this all.</p> +<p>This leads us to graph analytics in a broader sense. Some of the questions addressed here will still fit in the materialized summaries+declarative queries pattern but the more complex summarization and clustering moves towards iterative algorithms.</p> +<p>There is at present a strong interest in developing graph analytics benchmarks in LDBC. This is an activity that extends beyond the FP7 project duration and beyond the initial partners. To this effect I have implemented some SQL extensions for BSP style processing, as hinted at on my blog. These will be covered in more detail in January, when there are actual experiments.</p> + + + + + Sizing AWS Instances for the Semantic Publishing Benchmark + https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/ + Wed, 17 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/ + <p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the famous <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">BBC Dynamic Semantic Publishing</a> scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volume of read requests (SPARQL queries collecting recent content and data to generate web page on a specific subject, e.g. Frank Lampard). As we <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">wrote earlier</a>, SPB was already successfully used to help developers to identify performance issues and to introduce optimizations in SPARQL engines such as GraphDB and Virtuoso. Now we are at the point to experiment with different sizes of the benchmark and different hardware configurations.</p> +<p>Lately we tested different Amazon Web Services (<a href="https://aws.amazon.com/">AWS</a>) instance types for running SPB basic interactive query mix in parallel with the standard editorial updates – precisely the type of workload that <a href="https://www.ontotext.com/products/ontotext-graphdb/">GraphDB</a> experiences in the backend of BBC Sport website. We discovered and report below a number of practical guidelines about the optimal instance types and configurations. We have proven that SPB 50M workloads can be executed efficiently on a mid-sized AWS instance – c3.2xlarge machine executes 16 read queries and 15 update operations per second. For $1 paid to Amazon for such instance GraphDB executes 140 000 queries and 120 000 updates. 
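</p>
+<p>To make the per-dollar arithmetic explicit (a back-of-the-envelope check against the c3.2xlarge row of Table 1 below, using the rounded throughput figures and the hourly price; the table values differ slightly because they are computed from unrounded rates):</p>
+<pre tabindex="0"><code>-- queries/USD = (queries/sec * 3600 sec/hour) / (USD/hour); likewise for updates.
-- Written as a FROM-less SELECT, which runs on engines that allow it; otherwise it is just arithmetic.
SELECT 16.46 * 3600 / 0.42 AS queries_per_usd,   -- roughly 141 000
       14.56 * 3600 / 0.42 AS updates_per_usd;   -- roughly 124 800
</code></pre>
+<p>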
The most interesting discovery in this experiment is that if BBC were hosting the triplestore behind their Dynamic Semantic Publishing architecture at AWS, the total cost of the server infrastructure behind their Worldcup 2010 website would have been about $80/day.</p> +<h3 id="the-experiment">The Experiment</h3> +<p>For our tests we use:</p> +<ul> +<li>GraphDB Standard v6.1</li> +<li>LDBC-SPB test driver (version 0.1.dc9a626 from 10.Nov.2014) configured as follows: +<ul> +<li>8 aggregation agents (read threads) and 2 editorial agents (write threads); for some configurations we experimented with different numbers of agents also</li> +<li>50M dataset (SF1)</li> +<li>40 minutes of benchmark run time (60 seconds of warm up)</li> +</ul> +</li> +<li>5 different Amazon EC2 instances and one local server</li> +</ul> +<p>Each test run is cold, i.e. data is newly loaded for each run. We set a 5 GByte cache configuration, which is sufficient for the size of the generated dataset. We use the same query substitution parameters (the same randomization seed) for every run, so that we are sure that all test runs are identical.</p> +<p>We use two types of instances – M3 and C3 instances. They both provide SSD storage for fast I/O performance. The M3 instances are with E5-2670v2, 2.50GHz CPU and provide good all-round performance, while the C3 instances are compute optimized with stronger CPU – E5-2680v2, 2.80GHz, but have half as much memory as the M3.</p> +<p>We also use a local physical server with dual-CPU – E5-2650v2, 2.60Ghz; 256GB of RAM and RAID-0 array of SSD in order to provide ground for interpretation of the performance for the virtualized AWS instances. The CPU capacity of the AWS instances is measured in vCPUs (virtual CPU). A vCPU is a logical core – one hyper-thread of one physical core of the corresponding Intel Xeon processor used by Amazon. This means that a vCPU represents roughly half a physical core, even though the performance of a hyper-threaded core is not directly comparable with two non-hyper-threaded cores. We should keep this in mind comparing AWS instances to physical machines, i.e. our local server with two CPUs with 8 physical cores each has 32 logical cores, which is more than c3.4xlarge instance with 16 vCPUs.</p> +<h3 id="the-results">The Results</h3> +<p>For the tests we measured:</p> +<ul> +<li><em>queries/s</em> for the read threads, where queries include SELECT and CONSTRUCT</li> +<li><em>updates/s</em> for the write threads, where an update operation is INSERT or DELETE</li> +<li><em>queries/$</em> and <em>updates/$</em> – respectively queries or updates per dollar is calculated for each AWS instance type based on price and update throughput</li> +<li><em>update/vCPU</em> – modification operations per vCPU per second</li> +</ul> +<p>Results (Table 1.) provide strong evidence that performance depends mostly on processor power. This applies to both queries and updates - which in the current AWS setup go on par with one another. Comparing M3 and C3 instances with equal vCPUs we can see that performance is only slightly higher for the M3 machines and even lower for selects with 8 vCPUs. 
Taking into account the lower price of C3 because of their lower memory, it is clear that C3 machines are better suited for this type of workload and the sweet spot between price and performance is c3.2xlarge machine.</p> +<p>The improvement in performance between the c3.xlarge and c3.2xlarge is more than twofold where the improvement between c3.2xlarge and c3.4xlarge is considerably lower. We also observe slower growth between c3.4xlarge and the local server machine. This is an indication that for SPB at this scale the difference between 7.5GB and 15GB of RAM is substantial, but RAM above this amount cannot be utilized efficiently by GraphDB.</p> +<p>Table 1. SPB Measurement Results on AWS and Local Servers</p> +<table> +<thead> +<tr> +<th>Server Type</th> +<th>vCPUs</th> +<th>R/W Agents</th> +<th>RAM (GB)</th> +<th>&ldquo;Storage (GB, SSD)&rdquo;</th> +<th>Price USD/h</th> +<th>Queries/ sec.</th> +<th>Updates/ sec.</th> +<th>Queries/ USD</th> +<th>Updates/ USD</th> +<th>Updates/ vCPU</th> +</tr> +</thead> +<tbody> +<tr> +<td>m3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>15</td> +<td>2x 40</td> +<td>0.28</td> +<td>8.39</td> +<td>8.23</td> +<td>107 882</td> +<td>105 873</td> +<td>2.06</td> +</tr> +<tr> +<td>m3.2xlarge</td> +<td>8</td> +<td>8/2</td> +<td>30</td> +<td>2x 80</td> +<td>0.56</td> +<td>15.44</td> +<td>15.67</td> +<td>99 282</td> +<td>100 752</td> +<td>1.96</td> +</tr> +<tr> +<td>c3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>7.5</td> +<td>2x 40</td> +<td>0.21</td> +<td>7.17</td> +<td>6.78</td> +<td>122 890</td> +<td>116 292</td> +<td>1.7</td> +</tr> +<tr> +<td><strong>c3.2xlarge</strong></td> +<td><strong>8</strong></td> +<td><strong>8/2</strong></td> +<td><strong>15</strong></td> +<td><strong>2x 80</strong></td> +<td><strong>0.42</strong></td> +<td><strong>16.46</strong></td> +<td><strong>14.56</strong></td> +<td><strong>141 107</strong></td> +<td><strong>124 839</strong></td> +<td><strong>1.82</strong></td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>8/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>23.23</strong></td> +<td><strong>21.17</strong></td> +<td><strong>99 578</strong></td> +<td><strong>90 736</strong></td> +<td><strong>1.32</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>8/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>22.89</td> +<td>20.39</td> +<td>98 100</td> +<td>87 386</td> +<td>1.27</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/2</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.6</td> +<td>19.11</td> +<td>114 000</td> +<td>81 900</td> +<td>1.19</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.19</td> +<td>19.18</td> +<td>112 243</td> +<td>82 200</td> +<td>1.2</td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>14/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>30.84</strong></td> +<td><strong>16.88</strong></td> +<td><strong>132 171</strong></td> +<td><strong>72 343</strong></td> +<td><strong>1.06</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>14/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>29.67</td> +<td>17.8</td> +<td>127 157</td> +<td>76 286</td> +<td>1.11</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>8/2</td> +<td>256</td> +<td>8x 256</td> 
+<td>0.85</td>
+<td>37.11</td>
+<td>32.04</td>
+<td>156 712</td>
+<td>135 302</td>
+<td>1</td>
+</tr>
+<tr>
+<td>Local</td>
+<td>32</td>
+<td>8/3</td>
+<td>256</td>
+<td>8x 256</td>
+<td>0.85</td>
+<td>37.31</td>
+<td>32.07</td>
+<td>157 557</td>
+<td>135 429</td>
+<td>1</td>
+</tr>
+<tr>
+<td><strong>Local</strong></td>
+<td><strong>32</strong></td>
+<td><strong>10/2</strong></td>
+<td><strong>256</strong></td>
+<td><strong>8x 256</strong></td>
+<td><strong>0.85</strong></td>
+<td><strong>40</strong></td>
+<td><strong>31.01</strong></td>
+<td><strong>168 916</strong></td>
+<td><strong>130 952</strong></td>
+<td><strong>0.97</strong></td>
+</tr>
+<tr>
+<td>Local</td>
+<td>32</td>
+<td>14/2</td>
+<td>256</td>
+<td>8x 256</td>
+<td>0.85</td>
+<td>36.39</td>
+<td>26.42</td>
+<td>153 672</td>
+<td>111 569</td>
+<td>0.83</td>
+</tr>
+<tr>
+<td>Local</td>
+<td>32</td>
+<td>14/3</td>
+<td>256</td>
+<td>8x 256</td>
+<td>0.85</td>
+<td>36.22</td>
+<td>26.39</td>
+<td>152 954</td>
+<td>111 443</td>
+<td>0.82</td>
+</tr>
+<tr>
+<td>Local</td>
+<td>32</td>
+<td>20/2</td>
+<td>256</td>
+<td>8x 256</td>
+<td>0.85</td>
+<td>34.59</td>
+<td>23.86</td>
+<td>146 070</td>
+<td>100 759</td>
+<td>0.75</td>
+</tr>
+</tbody>
+</table>
+<h3 id="the-optimal-number-of-test-agents">The Optimal Number of Test Agents</h3>
+<p>Experimenting with different numbers of aggregation (read) and editorial (write) agents at c3.4xlarge and the local server, we made some interesting observations:</p>
+<ul>
+<li>There is almost no benefit in using more than 2 write agents. This can be explained by the fact that certain aspects of handling writes in GraphDB are serialized, i.e. they cannot be executed in parallel across multiple write threads;</li>
+<li>Using more read agents can have a negative impact on update performance. This is proven by the c3.4xlarge results with 8/2 and with 14/2 agents - while in the latter case GraphDB handles a somewhat higher number of queries (31 vs. 23), we see a drop in the update rates (from 21 to 17);</li>
+<li>Overall, the configuration with 8 read agents and 2 write agents delivers good, balanced results across various hardware configurations;</li>
+<li>For machines with more than 16 cores, a configuration like 10/2 or 14/2 would maximize the number of selects, still with good update rates. This way one can get 30 queries/sec. on c3.4xlarge and 40 queries/sec. on a local server;</li>
+<li>Launching more than 14 read agents does not help even on the local server with 32 logical cores. This indicates that at this point we are reaching constraints such as memory bandwidth, IO throughput and the degree of parallelization.</li>
+<li>There is some overhead in handling a bigger number of agents, as the local server tests with 14/3 and 20/2 show the worst results for both queries and updates.</li>
+</ul>
+<h3 id="efficiency-and-cost">Efficiency and Cost</h3>
+<p>AWS instance type c3.2xlarge provides the best price/performance ratio for applications where 15 updates/sec. are sufficient even at peak times. 
More intensive applications should use type c3.4xlarge, which guarantees more than 20 updates/sec.</p>
+<p>Cloud infrastructure providers like Amazon allow one to have a very clear account of the full cost of the server infrastructure, including hardware, hosting, electricity, network, etc.</p>
+<p>$1 spent on c3.2xlarge ($0.41/hour) allows for handling 140 000 queries, along with more than 120 000 update operations!</p>
+<p>The full cost of the server infrastructure is harder to compute in the case of purchasing a server and hosting it in a proprietary data center. Still, one can estimate the upper limits - for a machine like the local server used in this benchmark, this price is well below $1/hour. One should consider that this machine has 256GB of RAM, which is overkill for the Semantic Publishing Benchmark run at the 50M scale. Under all these assumptions we see that using a local server is cheaper than the most cost-efficient AWS instance. This is expected - owning a car is always cheaper than renting it for 3 years in a row. Actually, the fact that the difference in price per query is low in this case indicates that using AWS services comes at a very low extra cost.</p>
+<p>To put these figures in the context of a known real-world application, let us model the case of a GraphDB Enterprise replication cluster with 2 master nodes and 6 worker nodes - the size of the cluster that the BBC used for their FIFA Worldcup 2010 project. Given the c3.2xlarge instance type, the math works as follows:</p>
+<ul>
+<li><strong>100 queries/sec.</strong> handled by the cluster. This means about 360 000 queries per hour or more than 4 million queries per day. This is at least 2 times more than the actual load on GraphDB at the BBC during the peak times of big sports events.</li>
+<li><strong>10 updates/sec.</strong> - the speed of updates in a GraphDB Enterprise cluster is lower than the speed of each worker node in isolation. There are relatively few content management applications that need more than 36 000 updates per hour.</li>
+<li><strong>$81/day</strong> is the full cost of the server infrastructure. This indicates an annual operational cost for a cluster of this type in the range of $30 000, even without any effort to release some of the worker nodes in non-peak times.</li>
+</ul>
+
+
+
+
+ DATAGEN: a Realistic Social Network Data Generator
+ https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/
+ Sat, 06 Dec 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/
+ <p>In previous posts (<a href="https://ldbcouncil.org/post/getting-started-with-snb">Getting started with snb</a>, <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">DATAGEN: data generation for the Social Network Benchmark</a>), Arnau Prat discussed the main features and characteristics of DATAGEN: <em>realism</em>, <em>scalability</em>, <em>determinism</em>, <em>usability</em>. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity in a social network site during a period of time. In this post, we conduct a series of experiments that will shed some light on how realistic the data produced by DATAGEN looks. 
For our testing, we generated a dataset of scale factor 10 (i.e., social network of 73K users during 3 years) and loaded it into Virtuoso by following the <a href="https://github.com/ldbc/ldbc_snb_datagen">instructions for generating a SNB dataset</a> and <a href="https://github.com/ldbc/ldbc_snb_implementations/tree/master/interactive/virtuoso">for loading the dataset into Virtuoso</a>. In the following sections, we analyze several aspects of the generated dataset.</p> +<h3 id="a-realistic-social-graph">A Realistic social graph</h3> +<p>One of the most complexly structured graphs that can be found in the data produced by DATAGEN is the friends graph, formed by people and their <em><knows></em> relationships. We used the R script after Figure 1 to draw the social degree distribution in the SNB friends graph. As shown in Figure 1, the cumulative social degree distribution of the friends graph is similar to that from Facebook (See the note about <a href="https://www.facebook.com/notes/facebook-data-team/anatomy-of-facebook/10150388519243859">Facebook Anatomy</a>). This is not by chance, as DATAGEN has been designed to deliberately reproduce the Facebook&rsquo;s graph distribution.</p> +<p><img src="Cumulative-distribution.png" alt="image"> <br> +Figure 1: Cumulative distribution #friends per user</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-r" data-lang="r"><span style="display:flex;"><span><span style="color:#75715e">#R script for generating the social degree distribution </span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">#Input files: person_knows_person_*.csv</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(data.table) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(igraph) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(plotrix) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">require</span>(bit64) +</span></span><span style="display:flex;"><span>dflist <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">lapply</span>(<span style="color:#a6e22e">commandArgs</span>(trailingOnly <span style="color:#f92672">=</span> <span style="color:#66d9ef">TRUE</span>), fread, sep<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;|&#34;</span>, +</span></span><span style="display:flex;"><span> header<span style="color:#f92672">=</span>T, select<span style="color:#f92672">=</span><span style="color:#ae81ff">1</span><span style="color:#f92672">:</span><span style="color:#ae81ff">2</span>, colClasses<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;integer64&#34;</span>) +</span></span><span style="display:flex;"><span> df <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">rbindlist</span>(dflist) <span style="color:#a6e22e">setNames</span>(df, <span style="color:#a6e22e">c</span>(<span style="color:#e6db74">&#34;P1&#34;</span>, <span style="color:#e6db74">&#34;P2&#34;</span>)) +</span></span><span style="display:flex;"><span>d2 <span style="color:#f92672">&lt;-</span> df[,<span style="color:#a6e22e">length</span>(P2),by<span style="color:#f92672">=</span>P1] +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">pdf</span>(<span 
style="color:#e6db74">&#34;socialdegreedist.pdf&#34;</span>) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">plot</span>(<span style="color:#a6e22e">ecdf</span>(d2<span style="color:#f92672">$</span>V1),main<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Cummulative distribution #friends per user&#34;</span>, +</span></span><span style="display:flex;"><span> xlab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Number of friends&#34;</span>, ylab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Percentage number of users&#34;</span>, log<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;x&#34;</span>, +</span></span><span style="display:flex;"><span> xlim<span style="color:#f92672">=</span><span style="color:#a6e22e">c</span>(<span style="color:#ae81ff">0.8</span>, <span style="color:#a6e22e">max</span>(d2<span style="color:#f92672">$</span>V1) <span style="color:#f92672">+</span> <span style="color:#ae81ff">20</span>)) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">dev.off</span>() +</span></span></code></pre></div><h3 id="data-correlations">Data Correlations</h3> +<p>Data in real life as well as in a real social network is correlated; e.g. names of people living in Germany have a different distribution than those living in Netherlands, people who went to the same university in the same period have a much higher probability to be friends and so on and so forth. In this experiment we will analyze if data produced by DATAGEN also reproduces these phenomena.</p> +<p><em>Which are the most popular names of a country?</em></p> +<p>We run the following query on the database built in Virtuoso, which computes the distribution of the names of the people for a given country. In this query, <em>&lsquo;A_country_name&rsquo;</em> is the name of a particular country such as <em>&lsquo;Germany&rsquo;, &lsquo;Netherlands&rsquo;, or &lsquo;Vietnam&rsquo;</em>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> p_lastname, <span style="color:#66d9ef">count</span> (p_lastname) <span style="color:#66d9ef">as</span> namecnt +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">FROM</span> person, country +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> p_placeid <span style="color:#f92672">=</span> ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;A_country_name&#39;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> p_lastname <span style="color:#66d9ef">order</span> <span style="color:#66d9ef">by</span> namecnt <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we can see from Figures 2, 3, and 4, the distributions of names in Germany, Netherlands and Vietnam are different. A name that is popular in Germany such as <em>Muller</em> is not popular in the Netherlands, and it even does not appear in the names of people in Vietnam. 
We note that the names&rsquo; distribution may not be exactly the same as the contemporary names&rsquo; distribution in these countries, since the names resource files used in DATAGEN are extracted from Dbpedia, which may contain names from different periods of time.</p> +<p><img src="distribution-germany.png" alt="image"> <br> +Figure 2. Distribution of names in Germany</p> +<p><img src="distribution-netherlands.png" alt=""> <br> +Figure 3. Distribution of names in Netherlands</p> +<p><img src="distribution-vietnam.png" alt=""> <br> +Figure 4. Distribution of names in Vietnam</p> +<p><em>Where my friends are living?</em></p> +<p>We run the following query, which computes the locations of the friends of people living in China.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> fctry.ctry_name, <span style="color:#66d9ef">count</span> (<span style="color:#f92672">*</span>) <span style="color:#66d9ef">from</span> person <span style="color:#66d9ef">self</span>, person +</span></span><span style="display:flex;"><span>friend, country pctry, knows, country fctry +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> pctry.ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;China&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> <span style="color:#66d9ef">self</span>.p_placeid <span style="color:#f92672">=</span> pctry.ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> <span style="color:#66d9ef">self</span>.p_personid <span style="color:#66d9ef">and</span> friend.p_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> fctry.ctry_city <span style="color:#f92672">=</span> friend.p_placeid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> fctry.ctry_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As shown in the graph, most of the friends of people living in China are also living in China. The rest comes predominantly from near-by countries such as India, Vietnam.</p> +<p><img src="chinese-friends.png" alt=""> <br> +Figure 5. 
Locations of friends of people in China</p> +<p><em>Where my friends are studying?</em></p> +<p>Finally, we run the following query to find where the friends of people studying at a specific university (e.g., “Hangzhou_International_School”) are studying at.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> o2.o_name, <span style="color:#66d9ef">count</span>(o2.o_name) <span style="color:#66d9ef">from</span> knows, person_university +</span></span><span style="display:flex;"><span>p1, person_university p2, organisation o1, organisation o2 +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> +</span></span><span style="display:flex;"><span> p1.pu_organisationid <span style="color:#f92672">=</span> o1.o_organisationid +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> o1.o_name<span style="color:#f92672">=</span><span style="color:#e6db74">&#39;Hangzhou_International_School&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> p1.pu_personid <span style="color:#66d9ef">and</span> p2.pu_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> p2.pu_organisationid <span style="color:#f92672">=</span> o2.o_organisationid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> o2.o_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we see from Figure 6, most of the friends of the Hangzhou International School students also study at that university. This is a realistic correlation, as people studying at the same university have a much higher probability to be friends. Furthermore, top-10 universities for the friends of the Hangzhou School students’ are from China, while people from foreign universities have small number of friends that study in Hangzhou School (See Table 1).</p> +<p><img src="friends-international-school.png" alt=""> <br> +Figure 6. Top-10 universities where the friends of Hangzhou International School students are studying at.</p> +<table> +<thead> +<tr> +<th>Name</th> +<th># of friends</th> +</tr> +</thead> +<tbody> +<tr> +<td>Hangzhou_International_School</td> +<td>12696</td> +</tr> +<tr> +<td>Anhui_University_of_Science_and_Technology</td> +<td>4071</td> +</tr> +<tr> +<td>China_Jiliang_University</td> +<td>3519</td> +</tr> +<tr> +<td>&hellip;</td> +<td></td> +</tr> +<tr> +<td>Darmstadt_University_of_Applied_Sciences</td> +<td>1</td> +</tr> +<tr> +<td>Calcutta_School_of_Tropical_Medicine</td> +<td>1</td> +</tr> +<tr> +<td>Chettinad_Vidyashram</td> +<td>1</td> +</tr> +<tr> +<td>Women&rsquo;s_College_Shillong</td> +<td>1</td> +</tr> +<tr> +<td>Universitas_Nasional</td> +<td>1</td> +</tr> +</tbody> +</table> +<p>Table 1. Universities where friends of Hangzhou International School students are studying at.</p> +<p>In a real social network, data is riddled with many more correlations; it is a true data mining task to extract these. 
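</p>
+<p>As one more example of this kind of probing, a query along the following lines (an untested sketch that only reuses the table and column names appearing in the queries above) would show how strongly friendship edges are biased towards staying within a single country:</p>
+<pre tabindex="0"><code>-- Sketch: how many knows-edges connect people from the same country vs. different countries.
SELECT CASE WHEN pctry.ctry_name = fctry.ctry_name
            THEN 'same country' ELSE 'different country' END AS edge_kind,
       count(*) AS edges
FROM person self, person friend, country pctry, country fctry, knows
WHERE self.p_placeid = pctry.ctry_city
  AND friend.p_placeid = fctry.ctry_city
  AND k_person1id = self.p_personid
  AND k_person2id = friend.p_personid
GROUP BY CASE WHEN pctry.ctry_name = fctry.ctry_name
              THEN 'same country' ELSE 'different country' END
ORDER BY 2 DESC;
</code></pre>
+<p>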
Even though DATAGEN may not be able to model all real-life data correlations, it can generate a dataset that reproduces many of the important characteristics found in a real social network, and it additionally introduces a series of plausible correlations into it. Many more interesting data correlations can also be found by playing with the SNB generated data.</p>
+
+
+
+
+ SNB Driver - Part 1
+ https://ldbcouncil.org/post/snb-driver-part-1/
+ Thu, 27 Nov 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/snb-driver-part-1/
+ <p>In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as the driver). Software and documentation for this driver is available here: <a href="https://github.com/ldbc/ldbc_driver/">https://github.com/ldbc/ldbc_driver/</a>. Multiple reference implementations by two vendors are available here: <a href="https://github.com/ldbc/ldbc_snb_implementations">https://github.com/ldbc/ldbc_snb_implementations</a>, and discussion of the schema, data properties, and related content is available here: <a href="https://github.com/ldbc/ldbc_snb_docs">https://github.com/ldbc/ldbc_snb_docs</a>.</p>
+<p>The following will concentrate on key decisions and techniques that were developed to support scalable, repeatable, distributed workload execution.</p>
+<h3 id="problem-description">Problem Description</h3>
+<p>The driver generates a stream of operations (e.g. create user, create post, create comment, retrieve person&rsquo;s posts etc.) and then executes them using the provided database connector. To be capable of generating heavier loads, it executes the operations from this stream in parallel. If there were no dependencies between operations (e.g., reads that depend on the completion of writes), this would be trivial. This is the case, for example, for the classical TPC-C benchmark, where splitting the transaction stream into parallel clients (terminals) is trivial. However, for the LDBC SNB Interactive Workload this is not the case: some operations within the stream do depend on others, others are depended on, some both depend on others and are depended on, and some neither depend on others nor are they depended on.</p>
+<p>Consider, for example, a Social Network Benchmark scenario, where the data generator outputs a sequence of events such as User A posted a picture, User B left a comment on the picture of User A, etc. The second event depends on the first one in the sense that there is a causal ordering between them: User B can only leave a comment on the picture once it has been posted. The generated events are already ordered by their time stamp, so in the case of single-threaded execution this ordering is observed by default: the driver issues a request to the SUT with the first event (i.e., User A posts a picture), and after its completion it issues the second event (create a comment). However, if events are executed in parallel, these two events may end up in different parallel sequences of events. 
Therefore, a driver needs a mechanism to ensure the dependency is observed even when the dependent events are in different parallel update streams.</p>
+<p>The next blog entries in this series will discuss the approaches used in the driver to deal with these challenges.</p>
+
+
+
+
+ Making Semantic Publishing Execution Rules
+ https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/
+ Tue, 18 Nov 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/
+ <p><a href="https://ldbcouncil.org/">LDBC</a> <a href="https://ldbcouncil.org/benchmarks/spb">SPB (Semantic Publishing Benchmark)</a> is based on the BBC linked data platform use case. Thus the data modelling and transaction mix reflects the BBC&rsquo;s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an <a href="https://www.ontotext.com/products/ontotext-graphdb-owlim/">Ontotext Graph DB</a> deployment. Graph DB was formerly known as Owlim.</p>
+<p>So, in SPB we wanted to address substantially more complex queries than the lookups that the BBC linked data platform primarily serves. Diverse dataset summaries, timelines and faceted search qualified by keywords and/or geography are examples of the online user experience that SPB needs to cover.</p>
+<p>SPB is not per se an analytical workload, but we still find that the queries fall broadly into two categories:</p>
+<ul>
+<li>
+<p>Some queries are centred on a particular search or entity. The amount of data touched by the query does not grow at the same rate as the dataset.</p>
+</li>
+<li>
+<p>Some queries cover whole cross sections of the dataset, e.g. find the most popular tags across the whole database.</p>
+</li>
+</ul>
+<p>These different classes of questions need to be separated in a metric, otherwise the short lookup dominates at small scales and the large query at large scales.</p>
+<p>Another guiding factor of SPB was the BBC&rsquo;s and others&rsquo; express wish to cover operational aspects such as online backups, replication and fail-over in a benchmark. True, most online installations have to deal with these things, which are as yet as good as absent from present benchmark practice. We will look at these aspects in a different article; for now, I will just discuss the matter of workload mix and metric.</p>
+<p>Normally the lookup and analytics workloads are divided into different benchmarks. Here we will try something different. There are three things the benchmark does:</p>
+<ul>
+<li>
+<p>Updates - These sometimes insert a graph, sometimes delete and re-insert the same graph, sometimes just delete a graph. These are logarithmic to data size.</p>
+</li>
+<li>
+<p>Short queries - These are lookups that most often touch on recent data and can drive page impressions. These are roughly logarithmic to data scale.</p>
+</li>
+<li>
+<p>Analytics - These cover a large fraction of the dataset and are roughly linear to data size.</p>
+</li>
+</ul>
+<p>A test sponsor can decide on the query mix within certain bounds. A qualifying run must sustain a minimum, scale-dependent update throughput and must execute a scale-dependent number of analytical query mixes or run for a scale-dependent duration. The minimum update rate, the minimum number of analytics mixes and the minimum duration all grow logarithmically with data size. Within these limits, the test sponsor can decide how to mix the workloads. Publishing several results, emphasizing different aspects, is also possible. 
A given system may be specially good at one aspect, leading the test sponsor to accentuate this.</p> +<p>The benchmark has been developed and tested at small scales, between 50 and 150M triples. Next we need to see how it actually scales. There we expect to see how the two query sets behave differently. One effect that we see right away when loading data is that creating the full text index on the literals is in fact the longest running part. For a SF 32 ( 1.6 billion triples) SPB database we have the following space consumption figures:</p> +<ul> +<li> +<p>46886 MB of RDF literal text</p> +</li> +<li> +<p>23924 MB of full text index for RDF literals</p> +</li> +<li> +<p>23598 MB of URI strings</p> +</li> +<li> +<p>21981 MB of quads, stored column-wise with default index scheme</p> +</li> +</ul> +<p>Clearly, applying column-wise compression to the strings is the best move for increasing scalability. The literals are individually short, so literal per literal compression will do little or nothing but applying this by the column is known to get a 2x size reduction with Google Snappy. The full text index does not get much from column store techniques, as it already consists of words followed by space efficient lists of word positions. The above numbers are measured with Virtuoso column store, with quads column wise and the rest row-wise. Each number includes the table(s) and any extra indices associated to them.</p> +<p>Let&rsquo;s now look at a full run at unit scale, i.e. 50M triples.</p> +<p>The run rules stipulate a minimum of 7 updates per second. The updates are comparatively fast, so we set the update rate to 70 updates per second. This is seen not to take too much CPU. We run 2 threads of updates, 20 of short queries and 2 of long queries. The minimum run time for the unit scale is 10 minutes, so we do 10 analytical mixes, as this is expected to take 10 a little over 10 minutes. The run stops by itself when the last of the analytical mixes finishes.</p> +<p>The interactive driver reports:</p> +<pre tabindex="0"><code>Seconds run : 2144 + Editorial: + 2 agents + + 68164 inserts (avg : 46 ms, min : 5 ms, max : 3002 ms) + 8440 updates (avg : 72 ms, min : 15 ms, max : 2471 ms) + 8539 deletes (avg : 37 ms, min : 4 ms, max : 2531 ms) + + 85143 operations (68164 CW Inserts (98 errors), 8440 CW Updates (0 errors), 8539 CW Deletions (0 errors)) + 39.7122 average operations per second + + Aggregation: + 20 agents + + 4120 Q1 queries (avg : 789 ms, min : 197 ms, max : 6767 ms, 0 errors) + 4121 Q2 queries (avg : 85 ms, min : 26 ms, max : 3058 ms, 0 errors) + 4124 Q3 queries (avg : 67 ms, min : 5 ms, max : 3031 ms, 0 errors) + 4118 Q5 queries (avg : 354 ms, min : 3 ms, max : 8172 ms, 0 errors) + 4117 Q8 queries (avg : 975 ms, min : 25 ms, max : 7368 ms, 0 errors) + 4119 Q11 queries (avg : 221 ms, min : 75 ms, max : 3129 ms, 0 errors) + 4122 Q12 queries (avg : 131 ms, min : 45 ms, max : 1130 ms, 0 errors) + 4115 Q17 queries (avg : 5321 ms, min : 35 ms, max : 13144 ms, 0 errors) + 4119 Q18 queries (avg : 987 ms, min : 138 ms, max : 6738 ms, 0 errors) + 4121 Q24 queries (avg : 917 ms, min : 33 ms, max : 3653 ms, 0 errors) + 4122 Q25 queries (avg : 451 ms, min : 70 ms, max : 3695 ms, 0 errors) + + 22.5239 average queries per second. 
Pool 0, queries [ Q1 Q2 Q3 Q5 Q8 Q11 Q12 Q17 Q18 Q24 Q25 ] + + 45318 total retrieval queries (0 timed-out) + 22.5239 average queries per second +</code></pre><p>The analytical driver reports:</p> +<pre tabindex="0"><code>Aggregation: + 2 agents + + 14 Q4 queries (avg : 9984 ms, min : 4832 ms, max : 17957 ms, 0 errors) + 12 Q6 queries (avg : 4173 ms, min : 46 ms, max : 7843 ms, 0 errors) + 13 Q7 queries (avg : 1855 ms, min : 1295 ms, max : 2415 ms, 0 errors) + 13 Q9 queries (avg : 561 ms, min : 446 ms, max : 662 ms, 0 errors) + 14 Q10 queries (avg : 2641 ms, min : 1652 ms, max : 4238 ms, 0 errors) + 12 Q13 queries (avg : 595 ms, min : 373 ms, max : 1167 ms, 0 errors) + 12 Q14 queries (avg : 65362 ms, min : 6127 ms, max : 136346 ms, 2 errors) + 13 Q15 queries (avg : 45737 ms, min : 12698 ms, max : 59935 ms, 0 errors) + 13 Q16 queries (avg : 30939 ms, min : 10224 ms, max : 38161 ms, 0 errors) + 13 Q19 queries (avg : 310 ms, min : 26 ms, max : 1733 ms, 0 errors) + 12 Q20 queries (avg : 13821 ms, min : 11092 ms, max : 15435 ms, 0 errors) + 13 Q21 queries (avg : 36611 ms, min : 14164 ms, max : 70954 ms, 0 errors) + 13 Q22 queries (avg : 42048 ms, min : 7106 ms, max : 74296 ms, 0 errors) + 13 Q23 queries (avg : 48474 ms, min : 18574 ms, max : 93656 ms, 0 errors) + 0.0862 average queries per second. Pool 0, queries [ Q4 Q6 Q7 Q9 Q10 Q13 Q14 Q15 Q16 Q19 Q20 Q21 Q22 Q23 ] + + 180 total retrieval queries (2 timed-out) + 0.0862 average queries per second +</code></pre><p>The metric would be 22.52 qi/s, 310 qa/h, 39.7 u/s @ 50Mt (SF 1)</p> +<p>The SUT is dual Xeon E5-2630, all in memory. The platform utilization is steadily above 2000% CPU (over 20/24 hardware threads busy on the DBMS). The DBMS is Virtuoso open source, (<a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack at github.com</a>, <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics</a>).</p> +<p>The minimum update rate of 7/s was sustained but fell short of the target of 70./s. In this run, most demand was put on the interactive queries. Different thread allocations would give different ratios of the metric components. The analytics mix is for example about 3x faster without other concurrent activity.</p> +<p>Is this good or bad? I would say that this is possible but better can certainly be accomplished.</p> +<p>The initial observation is that Q17 is the worst of the interactive lot. 3x better is easily accomplished by avoiding a basic stupidity. The query does the evil deed of checking for a substring in a URI. This is done in the wrong place and accounts for most of the time. The query is meant to test geo retrieval but ends up doing something quite different. Optimizing this right would almost double the interactive score. There are some timeouts in the analytical run, which as such disqualifies the run. This is not a fully compliant result but is close enough to give an idea of the dynamics. So we see that the experiment is definitely feasible, is reasonably defined and that the dynamics seen make sense.</p> +<p>As an initial comment of the workload mix, I&rsquo;d say that interactive should have a few more very short point lookups to stress compilation times and give a higher absolute score of queries per second.</p> +<p>Adjustments to the mix will depend on what we find out about scaling. 
As with SNB, it is likely that the workload will shift a little, so this result might not be comparable with future ones.</p> +<p>In the next SPB article, we will look closer at performance dynamics and choke points and will have an initial impression on scaling the workload.</p> + + + + + Fifth TUC Meeting + https://ldbcouncil.org/event/fifth-tuc-meeting/ + Fri, 14 Nov 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fifth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce its fifth Technical User<br> +Community (TUC) meeting.</p> +<p>This will be a one-day event at the National Hellenic Research Institute<br> +in Athens, Greece on <strong>Friday November 14, 2014</strong>.</p> +<h3 id="agenda">Agenda</h3> +<p>10:30 - 11:00 Coffee Break</p> +<p>11:00 - 11:10 Peter Boncz (VUA) Welcome &amp; LDBC project status update (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979841.pptx">Presentation</a>)</p> +<p>11:10 - 11:25 Venelin Kotsev (ONTO) Semantic Publishing Benchmark:Short Presentation of SPB and Status</p> +<p>Feedback &amp; Roadmap for SPB &amp; OWLIM (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979839.pdf">Presentation</a>)</p> +<p>11:25 - 11:30 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SPB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979828.pdf">Presentation</a>)</p> +<p>11:30 - 11:45 Alex Averbuch (NEO) Social Network Benchmark: Short Presentation of SNB and Status, Feedback &amp; Roadmap for SNB &amp; Neo4J (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979830.pdf">Presentation</a>)</p> +<p>11:45 - 12:00 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SNB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979829.pdf">Presentation</a>)</p> +<p>12:00 - 12:20 Arnau Prat (UPC) &amp; Andrey Gubichev Status, Feedback &amp; Roadmap for SNB Interactive &amp; Sparksee (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979836.pdf">Presentation</a> ) and Business Intelligence (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979837.pdf">Presentation</a>)</p> +<p>12:20 - 12:40 Tomer Sagi, &ldquo;Experience with SNB and TitanDB at HP&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979838.pptx">Presentation</a> )</p> +<p>12:40 - 13:00 Jakob Nelson, &ldquo;graphbench.org on the SNB datagen&rdquo;</p> +<p>13:00 - 14:30 Lunch Break@Byzantine &amp; Christian Museum (<a href="http://www.byzantinemuseum.gr/en/">link</a>)</p> +<p>14:30 - 14:50 Olaf Hartig, &ldquo;Integrating the Property Graph and RDF data models&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979831.pdf">Presentation</a>)\</p> +<p>Documents: <a href="http://arxiv.org/abs/1409.3288">arxiv/1409.3288</a>, <a href="http://arxiv.org/abs/1406.3399">arxiv/1406.3399</a></p> +<p>14:50 - 15:10 Maria-Esther Vidal and Maribel Acosta, &ldquo;Challenges to be addressed during Benchmarking SPARQL Federated Engines&rdquo; (<a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979842.pdf">Presentation</a>)</p> +<p>15:10 - 15:30 Evaggelia Pitoura, &ldquo;Historical Queries on Graphs&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979835.pdf">Presentation</a>)</p> +<p>15:30 - 16:00 Coffee Break</p> +<p>16:00 - 16:20 Manolis Terrovitis, Giannis Liagos, George Papastefanatos, &ldquo;Efficient Identification of Implicit Facts in Incomplete OWL2-EL Knowledge Bases&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979843.pdf">Presentation</a>)</p> +<p>16:20 - 16:40 Gunes Aluc, &ldquo;WatDiv: How to Tune-up your RDF Data Management System&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979832.pdf">Presentation</a>)</p> +<p>16:40 - 17:00 Giorgos Kollias, Yannis Smaragdakis, &ldquo;Benchmarking @LogicBlox&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979840.pdf">Presentation</a>)</p> +<p>17:00 - 17:15 Hassan Chafi, &ldquo;Oracle Labs Graph Strategy&rdquo;</p> +<p>17:15 - 17:25 Yinglong Xia, &ldquo;Property Graphs for Industry Solution at IBM&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979834.pdf">Presentation</a>)</p> +<p>17:25 - 17:30 Arthur Keen, &ldquo;Short Introduction to SPARQLcity&rdquo;</p> +<p><em><strong>20:30 Dinner @ Konservokouti <a href="https://plus.google.com/114240752029716758955/about?gl=gr&amp;hl=en">(link)</a></strong></em></p> +<p><em><strong>Get a Taxi, and go to Ippokratous 148, Athens, Neapoli Exarheion</strong></em></p> +<h4 id="logistics">Logistics</h4> +<p>The meeting will be held at the <a href="http://www.eie.gr/index-en.html">National Hellenic Research Foundation</a> located in <a href="http://www.eie.gr/location-en.html">downtown Athens</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/5964344.gif" alt=""></p> +<h4 id="travel">Travel</h4> +<p>Athens, Greece&rsquo;s capital city, is easily accessible by air. Travelers on flights to Athens will land at Athens Eleftherios Venizelos International Airport.</p> +<p>To arrive in the city center, you can take the metro from the airport (Line #3) and stop at either stop Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations. You can also take express Bus X95 and stop again at either Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations (the latter is the terminus for the bus).</p> +<p>You can also take a taxi from the airport that runs on a fixed price for the city center (45 euros). More information on how to move around in Athens from the airport can be found here: <a href="http://www.aia.gr/traveler/">http://www.aia.gr/traveler/</a></p> + + + + + Getting Started With the Semantic Publishing Benchmark + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + Sun, 09 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + <p>The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. 
It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies proposed by the BBC that define numerous properties for content; they contain all RDFS schema constructs and certain OWL ones.</p>
+<p>The benchmark proposes a data generator that uses the ontologies provided by the BBC and reference datasets (again provided by the BBC) to produce a set of valid instances; it works with a predefined set of distributions derived from the reference datasets. In addition to these distributions, the data generator also models:</p>
+<ul>
+<li>clustering of creative works around certain entities from the reference datasets (e.g. the association of an entity with creative works would decay exponentially in time)</li>
+<li>correlations between entities - there will be creative works about two entities for a certain period in time, so that a history of interactions is also modelled (e.g. J. Biden and B. Obama are tagged in creative works for a continuous period in time)</li>
+</ul>
+<p>The driver proposed by the benchmark measures the performance of CRUD operations on a SPARQL endpoint by starting a number of concurrently running editorial and aggregation agents. The former execute a series of insert, update and delete operations, whereas the latter execute a set of construct, describe, and select queries against the SPARQL endpoint. The benchmark can access all SPARQL endpoints that support the SPARQL 1.1 protocol. Tests have been run on OWLIM and Virtuoso. Attempts were also made with Stardog.</p>
+<p>Currently, the benchmark offers two workloads: a base version that consists of a mix of nine queries of different complexity that consider nearly all the features of the SPARQL 1.1 query language, including sorting, subqueries, limit, regular expressions and grouping. 
The queries aim at checking different choke points relevant to query optimisation such as:</p> +<ul> +<li>join ordering based on cardinality constraints - expressed by the different kinds of properties defined in the schema</li> +<li>subselects that aggregate the query results that the optimiser should recognise and evaluate first</li> +<li>optional and nested optional clauses where the optimiser is called to produce a plan where the execution of the optional triple patterns is performed last</li> +<li>reasoning along the RDFS constructs (subclass, subproperty hierarchies, functional, object and transitive properties etc.)</li> +<li>unions to be executed in parallel</li> +<li>optionals that contain filter expressions that should be executed as early as possible in order to eliminate intermediate results</li> +<li>ordering where the optimiser could consider the possibility to choose query plan(s) that facilitate the ordering of results</li> +<li>handling of geo-spatial predicates</li> +<li>full-text search optimisation</li> +<li>asynchronous execution of the aggregate sub-queries</li> +<li>use of distinct to choose the optimal query plan</li> +</ul> +<p>We give below Query 1 of the Semantic Publishing Benchmark.</p> +<pre tabindex="0"><code>PREFIX bbcevent:&lt;http://www.bbc.co.uk/ontologies/event/&gt; +PREFIX geo-pos:&lt;http://www.w3.org/2003/01/geo/wgs84_pos#&gt; +PREFIX bbc:&lt;http://www.bbc.co.uk/ontologies/bbc/&gt; +PREFIX time:&lt;http://www.w3.org/2006/time#&gt; +PREFIX event:&lt;http://purl.org/NET/c4dm/event.owl#&gt; +PREFIX music-ont:&lt;http://purl.org/ontology/mo/&gt; +PREFIX rdf:&lt;http://www.w3.org/1999/02/22-rdf-syntax-ns#&gt; +PREFIX foaf:&lt;http://xmlns.com/foaf/0.1/&gt; +PREFIX provenance:&lt;http://www.bbc.co.uk/ontologies/provenance/&gt; +PREFIX owl:&lt;http://www.w3.org/2002/07/owl#&gt; +PREFIX cms:&lt;http://www.bbc.co.uk/ontologies/cms/&gt; +PREFIX news:&lt;http://www.bbc.co.uk/ontologies/news/&gt; +PREFIX cnews:&lt;http://www.bbc.co.uk/ontologies/news/cnews/&gt; +PREFIX cconcepts:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX dbp-prop:&lt;http://dbpedia.org/property/&gt; +PREFIX geonames:&lt;http://sws.geonames.org/&gt; +PREFIX rdfs:&lt;http://www.w3.org/2000/01/rdf-schema#&gt; +PREFIX domain:&lt;http://www.bbc.co.uk/ontologies/domain/&gt; +PREFIX dbpedia:&lt;http://dbpedia.org/resource/&gt; +PREFIX geo-ont:&lt;http://www.geonames.org/ontology#&gt; +PREFIX bbc-pont:&lt;http://purl.org/ontology/po/&gt; +PREFIX tagging:&lt;http://www.bbc.co.uk/ontologies/tagging/&gt; +PREFIX sport:&lt;http://www.bbc.co.uk/ontologies/sport/&gt; +PREFIX skosCore:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX dbp-ont:&lt;http://dbpedia.org/ontology/&gt; +PREFIX xsd:&lt;http://www.w3.org/2001/XMLSchema#&gt; +PREFIX core:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX curric:&lt;http://www.bbc.co.uk/ontologies/curriculum/&gt; +PREFIX skos:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX cwork:&lt;http://www.bbc.co.uk/ontologies/creativework/&gt; +PREFIX fb:&lt;http://rdf.freebase.com/ns/&gt; + +# Query Name : query1 +# Query Description : +# Retrieve creative works about thing t (or that mention t) +# reasoning: rdfs:subClassOf, rdf:type +# join ordering: cwork:dateModified rdf:type owl:FunctionalProperty +# join ordering: cwork:dateCreated rdf:type owl:FunctionalProperty +# Choke Points : +# - join ordering based on cardinality of functional proerties cwork:dateCreated, cwork:dateModified +# Optimizer should use an efficient cost evaluation method 
for choosing the optimal join tree +# - A sub-select which aggregates results. Optimizer should recognize it and execute it first +# - OPTIONAL and nested OPTIONAL clauses (treated by query optimizer as nested sub-queries) +# Optimizer should decide to put optional triples on top of the join tree +# (i.e. delay their execution to the last possible moment) because OPTIONALs are treated as a left join +# - qiery optimizer has the chance to recognize the triple pattern : ?cWork a ?type . ?type rdfs:subClassOf cwork:CreativeWork +# and eliminate first triple (?cwork a ?type .) since ?cwork is a cwork:CreativeWork​ + +CONSTRUCT { + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:shortTitle ?shortTitle ; + cwork:about ?about ; + cwork:mentions ?mentions ; + cwork:dateCreated ?created ; + cwork:dateModified ?modified ; + cwork:description ?description ; + cwork:primaryFormat ?primaryFormat ; + bbc:primaryContentOf ?webDocument . + ?webDocument bbc:webDocumentType ?webDocType . + ?about rdfs:label ?aboutLabel ; + bbc:shortLabel ?aboutShortLabel ; + bbc:preferredLabel ?aboutPreferredLabel . + ?mentions rdfs:label ?mentionsLabel ; + bbc:shortLabel ?mentionsShortLabel ; + bbc:preferredLabel ?mentionsPreferredLabel . + ?creativeWork cwork:thumbnail ?thumbnail . + ?thumbnail a cwork:Thumbnail ; + cwork:altText ?thumbnailAltText ; + cwork:thumbnailType ?thumbnailType . +} +WHERE { + { + SELECT ?creativeWork + WHERE { + ?creativeWork {{{cwAboutOrMentions}}} {{{cwAboutOrMentionsUri}}} . + ?creativeWork a cwork:CreativeWork ; + cwork:dateModified ?modified . + } + ORDER BY DESC(?modified) + LIMIT 10 + } + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:dateModified ?modified . + OPTIONAL { ?creativeWork cwork:shortTitle ?shortTitle . } + OPTIONAL { ?creativeWork cwork:description ?description . } + OPTIONAL { ?creativeWork cwork:about ?about . + OPTIONAL { ?about rdfs:label ?aboutLabel . } + OPTIONAL { ?about bbc:shortLabel ?aboutShortLabel . } + OPTIONAL { ?about bbc:preferredLabel ?aboutPreferredLabel . } + } + OPTIONAL { + ?creativeWork cwork:mentions ?mentions . + OPTIONAL { ?mentions rdfs:label ?mentionsLabel . } + OPTIONAL { ?mentions bbc:shortLabel ?mentionsShortLabel . } + OPTIONAL { ?mentions bbc:preferredLabel ?mentionsPreferredLabel . } + } + OPTIONAL { ?creativeWork cwork:dateCreated ?created . } + OPTIONAL { ?creativeWork cwork:primaryFormat ?primaryFormat . } + OPTIONAL { ?webDocument bbc:primaryContent ?creativeWork . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork bbc:primaryContentOf ?webDocument . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork cwork:thumbnail ?thumbnail . + OPTIONAL { ?thumbnail cwork:altText ?thumbnailAltText . } + OPTIONAL { ?thumbnail cwork:thumbnailType ?thumbnailType . } + } +} +</code></pre><p>Listing 1. Semantic Publishing Benchmark: Query 1</p> +<p>The benchmark test driver is distributed as a jar file, but can also be built using an ant script. It is distributed with the BBC ontologies and reference datasets, the queries and update workloads discussed earlier and the configuration parameters for running the benchmark and for generating the data. 
It is organised in the following different phases: ontology loading and reference dataset loading, dataset generation and loading, warm-up (where a series of aggregation queries are run for a predefined amount of time), benchmark where all queries (aggregation and editorial) are run, conformance checking (that allows one to check whether the employed RDF engine implements OWL reasoning) and finally cleanup that removes all the data from the repository. The benchmark provides a certain degree of freedom where each phase can run independently of the others.</p> +<p>The data generator uses an RDF repository to load ontologies and reference datasets; actually, any system that will be benchmarked should have those ontologies loaded. Any repository that will be used for the data generation should be set up with context indexing, and finally geo-spatial indexing, if available, to serve the spatial queries. The current version of the benchmark has been tested with Virtuoso and OWLIM.</p> +<p>The generator uses configuration files that must be configured appropriately to set the values regarding the dataset size to produce, the number of aggregation and editorial agents, the query timeout, etc. The distributions used by the data generator could also be edited. The benchmark is very simple to run (once the RDF repository used to store the ontologies and the reference datasets is set up, and the configuration files updated appropriately) using the command: java -jar semantic_publishing_benchmark-*.jar test.properties. The benchmark produces three kinds of files that contain (a) brief information about each executed query, the size of the returned result, and the execution time (semantic_publishing_benchmark_queries_brief.log), (b) the detailed log of each executed query and its result (semantic_publishing_benchmark_queries_detailed.log), and (c) the benchmark results (semantic_publishing_benchmark_results.log).</p> +<p>Below we give an example of a run of the benchmark for OWLIM-SE. The benchmark reports the number of edit operations (inserts, updates, and deletions) and queries executed at the Nth second of a benchmark run. It also reports the total number of retrieval queries as well as the average number of queries executed per second.</p> +<pre tabindex="0"><code>Seconds run : 600 + Editorial: + 0 agents + + 0 operations (0 CW Inserts, 0 CW Updates, 0 CW Deletions) + 0.0000 average operations per second + + Aggregation: + 8 agents + + 298 Q1 queries + 267 Q2 queries + 243 Q3 queries + 291 Q4 queries + 320 Q5 queries + 286 Q6 queries + 255 Q7 queries + 274 Q8 queries + 271 Q9 queries + + 2505 total retrieval queries + 4.1750 average queries per second +</code></pre><p>Listing 2. A snippet of semantic_publishing_benchmark_results.log</p> +<p>We ran the benchmark under the following configuration: we used 8 aggregation agents for query execution and 4 data generator workers all running in parallel. The warm-up period is 120 seconds, during which a number of aggregation agents are run to prepare the tested systems for query execution. Aggregation agents run for a period of 600 seconds, and queries time out after 90 seconds. We used 10 sets of substitution parameters for each query. For data generation, ontologies and reference datasets are loaded in the OWLIM-SE repository. We used OWLIM-SE, Version 5.4.6287 with Sesame Version 2.6 and Tomcat Version 6.</p>
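+<p>The headline numbers can be recomputed directly from the results log shown in Listing 2. As an illustration only (this small helper is ours and is not part of the benchmark distribution), the following Java snippet sums the per-query counts and divides by the reported run time to obtain the average number of queries per second:</p>
+<pre tabindex="0"><code>import java.io.IOException;
+import java.nio.file.Files;
+import java.nio.file.Paths;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
+
+// Illustrative helper: recompute the totals from semantic_publishing_benchmark_results.log
+public class SpbResultSummary {
+    public static void main(String[] args) throws IOException {
+        String log = new String(Files.readAllBytes(Paths.get(args[0])));
+
+        Matcher seconds = Pattern.compile("Seconds run : (\\d+)").matcher(log);
+        Matcher queries = Pattern.compile("(\\d+) Q\\d+ queries").matcher(log);
+
+        int secondsRun = seconds.find() ? Integer.parseInt(seconds.group(1)) : 1;
+        int total = 0;
+        while (queries.find()) {
+            total += Integer.parseInt(queries.group(1)); // sum the per-query counts Q1..Q9
+        }
+        // e.g. 2505 retrieval queries / 600 s = 4.1750 average queries per second
+        System.out.printf("%d retrieval queries, %.4f queries per second%n",
+                total, (double) total / secondsRun);
+    }
+}
+</code></pre>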
+<p>The results we obtained for the 10M, 100M and 1B triple datasets are given in the table below:</p> +<table> +<thead> +<tr> +<th>#triples</th> +<th>Q1</th> +<th>Q2</th> +<th>Q3</th> +<th>Q4</th> +<th>Q5</th> +<th>Q6</th> +<th>Q7</th> +<th>Q8</th> +<th>Q9</th> +<th>#queries</th> +<th>avg. #q. per sec.</th> +</tr> +</thead> +<tbody> +<tr> +<td>10M</td> +<td>298</td> +<td>267</td> +<td>243</td> +<td>291</td> +<td>320</td> +<td>286</td> +<td>255</td> +<td>274</td> +<td>271</td> +<td>2505</td> +<td>4.1750</td> +</tr> +<tr> +<td>100M</td> +<td>53</td> +<td>62</td> +<td>51</td> +<td>52</td> +<td>44</td> +<td>62</td> +<td>25</td> +<td>55</td> +<td>45</td> +<td>449</td> +<td>0.7483</td> +</tr> +<tr> +<td>1B</td> +<td>34</td> +<td>29</td> +<td>22</td> +<td>24</td> +<td>25</td> +<td>29</td> +<td>0</td> +<td>29</td> +<td>28</td> +<td>220</td> +<td>0.3667</td> +</tr> +</tbody> +</table> + + + + + Choke Point Based Benchmark Design + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + <p>The <em>Linked Data Benchmark Council</em> (LDBC) mission is to design and maintain benchmarks for graph data management systems, to establish and enforce standards for running these benchmarks, and to publish and arbitrate the official benchmark results. The council and its <a href="https://ldbcouncil.org">https://ldbcouncil.org</a> website just launched, and in its first 1.5 years of existence, most effort at LDBC has gone into investigating the needs of the field through interaction with the LDBC Technical User Community (<a href="https://ldbcouncil.org/event/fifth-tuc-meeting">next TUC meeting</a> will be on October 6 in Athens) and indeed in <em>designing benchmarks</em>.</p> +<p>So, what makes a good benchmark design? Many talented people have paved our way in addressing this question, and for relational database systems specifically, the benchmarks produced by <a href="http://www.tpc.org/">TPC</a> have been very helpful in maturing relational database technology, and making it successful. Good benchmarks are <em>relevant</em> and <em>representative</em> (address important challenges encountered in practice), <em>understandable</em>, <em>economical</em> (implementable on simple hardware), <em>fair</em> (such as not to favor a particular product or approach), <em>scalable</em>, <em>accepted</em> by the community and <em>public</em> (e.g. all of its software is available in open source). This list stems from Jim Gray&rsquo;s <a href="http://research.microsoft.com/en-us/um/people/gray/BenchmarkHandbook/TOC.htm">Benchmark Handbook</a>. In this blogpost, I will share some thoughts on each of these aspects of good benchmark design.</p> +<p>A very important aspect of benchmark development is making sure that the community <em>accepts</em> a certain benchmark, and starts using it. A benchmark without published results, and therefore without any opportunity to compare results, remains irrelevant. A European FP7 project is a good place to start gathering a critical mass of support (and consensus, in the process) for a new benchmark from the core group of benchmark designers in the joint work performed by the consortium. Since in LDBC multiple commercial graph and RDF vendors are at the table (Neo Technologies, Openlink, Ontotext and Sparsity), a minimal consensus on <strong>fairness</strong> had to be established immediately.
The Linked Data Benchmark Council itself is a noncommercial, neutral entity which releases all its benchmark specifications, software, as well as many materials created during the design. LDBC has spent a lot of time engaging interested parties (mainly through its <a href="https://ldbcouncil.org/tags/tuc-meeting/">Technical User Community gatherings</a>) as well as lining up additional organizations as members of the Linked Data Benchmark Council. There is, in other words, a strong non-technical, human factor in getting benchmarks accepted.</p> +<p>The need for <em>understandability</em> for me means that a database benchmark should consist of a limited number of queries and result metrics. Hence I find TPC-H with its 22 queries more understandable than TPC-DS with its 99, because after (quite some) study and experience it is possible to understand the underlying challenges of all queries in TPC-H. It may also be possible for TPC-DS but the amount of effort is just much larger. Understandability also means for me that a particular query should behave similarly, regardless of the query parameters. Often, a particular query needs to be executed many times, and in order not to play into the hands of simple query caching and also to enlarge the access footprint of the workload, different query parameters should be used. However, parameters can strongly change the nature of a query, which is not desirable for the understandability of the workload. For instance, we know that TPC-H Q01 tests raw computation power, as its selection predicate eliminates almost nothing from the main fact table (LINEITEM), which it scans and aggregates into a small 4-tuple result. Using a selection parameter that would select only 0.1% of the data instead would seriously change the nature of Q01, e.g. making it amenable to indexing. This stability of parameter bindings is an interesting challenge for the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) of LDBC, which is not as uniform and uncorrelated as TPC-H. Addressing the challenge of obtaining parameter bindings that have similar execution characteristics will be the topic of a future blog post.</p> +<p>The <em>economical</em> aspect of benchmarking means that while rewarding high-end benchmark runs with higher scores, it is valuable if a meaningful run can also be done with small hardware. For this reason, it is good practice to use a performance-per-EURO (or $) metric, so that small installations, despite a lower absolute score, can still do well on that metric. The economical aspect is right now hurting the (still) leading relational OLTP benchmark TPC-C. Its implementation rules are such that for higher reported rates of throughput, a higher number of warehouses (i.e. larger data size) is needed. In the current day and age of JIT-compiled machine-code SQL procedures and CPU-cache optimized main memory databases, the OLTP throughput numbers now obtainable on modern transactional systems like HyPer on even a single server (it reaches more than 100,000 transactions per second) are so high that they lead to petabyte storage requirements. Not only does this make TPC-C very expensive to run, just by the sheer amount of hardware needed according to the rules, but it also undermines its representativity, since OLTP data sizes encountered in the field are much smaller than OLAP data sizes and do not run in the petabytes.</p> +<p><em>Representative</em> benchmarks can be designed by studying or even directly using real workload information, e.g. 
query logs. A rigorous example of this is the <a href="http://aksw.org/Projects/DBPSB.html">DBpedia benchmark</a> whose workload is based on the query logs of dbpedia.org. However, this SPARQL endpoint is a single public Virtuoso instance that has been configured to interrupt all long-running queries, so as to ensure the service remains responsive to as many users as possible. As a result, it is only practical to run small lookup queries on this database service, so the query log contained only such light queries. As a consequence, the DBpedia benchmark tests only small SPARQL queries that stress simple B-tree lookups (and not joins, aggregations, path expressions or inference) and poses almost no technical challenges for either query optimization or execution. The lesson, thus, is to balance representativity with relevance (see later).</p> +<p>The fact that a benchmark can be <em>scaled</em> in size favors the use of synthetic data (i.e. created by a data generator) because data generators can produce any desired quantity of data. I hereby note that in this day and age, data generators should be parallel. Single-threaded single-machine data generation just becomes unbearable even at terabyte scales. A criticism of synthetic data is that it may not be representative of real data, which e.g. tends to contain highly correlated data with skewed distributions. This may be addressed to a certain extent by injecting specific skew and correlations into synthetic data as well (but: which skew and which correlations?). An alternative is to use real data and somehow blow up or contract the data. This is the approach in the mentioned DBpedia benchmark, though such scaling will distort the original distributions and correlations. Scaling a benchmark is very useful to investigate the effect of data size on the metric, on individual queries, or even in micro-benchmark tests that are not part of the official query set. Typically OLTP database benchmarks have queries whose complexity is O(log(N)) of the data size N, whereas OLAP benchmarks have queries which are linear, O(N) or at most O(N.log(N)) &ndash; otherwise executing the benchmark on large instances is infeasible. OLTP queries thus typically touch little data, in the order of log(N) tuples. In order not to measure fully cold query performance, OLTP benchmarks for that reason need a warmup phase with O(N/log(N)) queries in order to get the system into a representative state.</p> +<p>Now, what makes a benchmark <em>relevant</em>? In LDBC we think that benchmarks should be designed such that crucial areas of functionality are highlighted, and in turn system architects are stimulated to innovate. Either to catch up with competitors and bring the performance and functionality in line with the state-of-the-art, or even to innovate and address technical challenges for which until now no good solutions exist, but which can give a decisive performance advantage in the benchmark. Inversely stated, benchmark design can thus be a powerful tool to influence the industry, as a benchmark design may set the agendas for multiple commercial design teams and database architects around the globe. To structure this design process, LDBC introduces the notion of <em>&ldquo;choke points&rdquo;</em>: by which we mean problems that challenge current technology. These choke points are collected and described early in the LDBC design process, and the workloads developed later are scored in terms of their coverage of relevant choke points. 
In the case of graph data querying, one of the choke points that is unique to the area is recursive Top-N query handling (e.g. shortest path queries). Another choke point that arises is the impact of correlations between attribute values of graph nodes (e.g. both employed by TUM) and the connectivity degree between nodes (the probability to be friends). The notion observed in practice is that people who are direct colleagues often are in each other&rsquo;s friend network. A query that selects people in a social graph who work for the same company, and then does a friendship traversal, may get bad intermediate result size estimates and therefore a suboptimal query plan, if optimizers remain unaware of value/structure correlations. So this is an area of functionality that the Social Network Benchmark (SNB) by LDBC will test.</p> +<p>To illustrate what choke points are in more depth, we wrote a <a href="https://ldbcouncil.org/docs/papers/tpc-h-analyzed-choke-points-tpctc2013.pdf">paper at the TPCTC 2013</a> conference that performs a post-mortem analysis of TPC-H and identifies 28 such choke points. <em><a href="chokepoints.png">This table</a></em> lists them all, grouped into six Choke Point (CP) areas (CP1 Aggregation, CP2 Join, CP3 Locality, CP4 Calculations, CP5 Subqueries and CP6 Parallelism). The classification also shows CP coverage over each of the 22 TPC-H queries (black is high impact, white is no impact):</p> +<p>I would recommend reading this paper to anyone who is interested in improving the TPC-H score of a relational database system, since this paper contains the collected experience of three database architects who have worked with TPC-H at length: Orri Erling (of Virtuoso), Thomas Neumann (HyPer, RDF-3X), and me (MonetDB, Vectorwise). Recently Orri Erling showed that this paper is not complete as he discovered one more choke-point area for TPC-H: Top-N pushdown. In a detailed blog entry, Orri shows how this technique can <a href="http://www.openlinksw.com/weblog/oerling/?id=1779">trivialize Q18</a>; and this optimization can single-handedly improve the overall TPC-H score by 10-15%. This is also a lesson for LDBC: even though we design benchmarks with choke points in mind, the queries themselves may bring to light unforeseen opportunities and choke-points that may give rise to yet unknown innovations.</p> +<p>LDBC has just published two benchmarks as Public Drafts, which essentially means that you are cordially invited to download and try out the RDF-focused Semantic Publishing Benchmark <a href="https://ldbcouncil.org/developer/spb">(SPB)</a> and the more graph-focused Social Network Benchmark (<a href="https://ldbcouncil.org/developer/snb">SNB</a>), and <a href="https://groups.google.com/forum/#!forum/ldbcouncil">tell us what you think</a>. 
Stay tuned for the coming detailed blog posts about these benchmarks, which will explain the graph and RDF processing choke-points that they test.</p> +<p><em>(for more posts from Peter Boncz, see also <a href="https://databasearchitects.blogspot.com">Database Architects</a>, a blog about data management challenges and techniques written by people who design and implement database systems)</em></p> + + + + + New Website Online LDBC Benchmarks Reach Public Draft + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + <p>The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23 2014, in announcing that two of the benchmarks that it has been developing for the past 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In the case of LDBC, the release is staged: for now, the benchmark software just runs read-only queries. This will be expanded in a few weeks with a mix of read and insert queries. Also, query validation will be added later. Watch this blog for the announcements to come, as this will be a matter of weeks to add.</p> +<p>The Public Draft stage means that the initial software (data generator, query driver) works and that an initial technical specification and documentation has been written. In other words, there is a testable version of the benchmark available for anyone who is interested. Public Draft status does not mean that the benchmarks have been adopted yet; rather, it means that LDBC has come closer to adopting them, but is now soliciting feedback from the users. The benchmarks will remain in this stage at least until October 6. On that date, LDBC is organizing its fifth <a href="https://ldbcouncil.org/event/fifth-tuc-meeting">Technical User Community meeting</a>. One of the themes for that meeting is collecting user feedback on the Public Drafts; this input will be used to either further evolve the benchmarks, or adopt them.</p> +<p>You can also see that we created this new website and a new logo. This website is different from <code>http://ldbc.eu</code>, which describes the EU project that kick-started LDBC. ldbcouncil.org is a website maintained by the Linked Data Benchmark Council legal entity, which will live on after the EU project stops (in less than a year). The Linked Data Benchmark Council is an independent, impartial, member-sustained organization dedicated to the creation of RDF and graph data management benchmarks and benchmark practices.</p> +<p>In the coming weeks, you will see many contributors in LDBC post items on this blog. Some of these blog entries will be very technical, others not, but all aim to explain what LDBC is doing for RDF and graph benchmarking, and why.</p> + + + + + Social Network Benchmark Goals + https://ldbcouncil.org/post/social-network-benchmark-goals/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/social-network-benchmark-goals/ + <p>Social Network interaction is amongst the most natural and widespread activities in the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, Social Networks are well understood from the point of view of the data involved and the interaction required by their actors. 
Thus, the concepts of friends of friends or retweets are well established for the data attributes they represent, and queries such as “find the friend of a specified person who has long worked in a company in a specified country” are natural for the users and easy to understand from a functional point of view.</p> +<p>From a totally different perspective, Social Networks are challenging technologically, being part of the Big Data arena, and require the execution of queries that involve complex relationship search and data traversal computations that turn out to be choke points for the data management solutions in the market.</p> +<p>With the objective of shaping a benchmark which is up to date as a use case, well understood by everybody, and which poses significant technological challenges, the LDBC consortium decided to create the Social Network Benchmark, <a href="https://ldbcouncil.org/benchmarks/snb">SNB</a>, which is eventually going to include three workloads: the Interactive, the Business Intelligence and the Analytical. Those workloads are going to share a common synthetic data generation tool that will mimic the data managed by real Social Networks.</p> +<p>The SNB data generator created by LDBC is an evolution of the S3G2 data generator and can be found at the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">LDBC Github repository</a>. The data generator is unique because it generates data that contains realistic distributions and correlations among variables that were not taken into consideration before. It also allows generating large datasets because it uses a Hadoop-based implementation to compute the complex data generated. The SNB data generator has already been used in different situations like the <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD programming contest 2014</a>.</p> +<p>The SNB presents the Interactive workload as the first of a breed, with the objective of resembling the queries that users may issue to a Social Network portal. Those are a combination of small read and write queries that express the needs of a user who is interacting with her friends and connections through the Social Network. Queries like the one described above (Q12 in the workload) are examples that set up choke points like pattern recognition or full traversals.</p> +<p>More details will be given in blog posts to follow, both for the data generator and for the specific characteristics of the workloads, allowing the users to obtain a first contact with the benchmarks.</p> + + + + + Welcome to the New Industry Oriented LDBC Organisation for Benchmarking RDF and Graph Technologies + https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/ + <p>It is with great pleasure that we announce the new LDBC organisation site at <a href="https://www.ldbcouncil.org">www.ldbcouncil.org</a>. The LDBC started as a European Community FP7 funded project with the objective of creating, fostering and becoming an industry reference for benchmarking RDF and Graph technologies. 
A period of more than one and a half years has led us to the creation of the first two benchmarks, the Semantic Publishing Benchmark and the Social Network Benchmark with its interactive workload, which you will find in the <em>benchmarks</em> menu on this site.</p> +<p>Those benchmarks will allow all the actors in the RDF and Graph industry to know who is who and how the different technology players are reacting to the results of their industry competitors. Thus, the users will have results to compare the technologies, and vendors will have a clear idea of how their products evolve compared to other vendors, all with the objective of fostering the technological growth of the RDF and Graph arena.</p> +<p>While the main objective of LDBC is to create benchmarks, we know that we need a strong community to grow and evolve those benchmarks, taking into consideration all the market and technology needs. With this objective, we have created a special section to engage the whole interested community through a blog, forums to discuss interesting issues and a lot of information on benchmarking, including links to other benchmarks, pointers to interesting conferences and venues and all the publications on benchmarking RDF and Graph technologies.</p> +<p>We want to make sure that we all know what benchmarking and the LDBC effort mean, both historically and from the global needs perspective. To make sure that this is accomplished, we set up a section open to the public with in-depth explanations of the history of industry benchmarking, LDBC and why our society needs such efforts globally.</p> +<p>Finally, we want to invite you to our Fifth Technical Users Community (TUC) meeting to be held in Athens next Monday Oct. 6th 2014. The main objective of this event is to allow for presentations on experiences with the two already released benchmarks, SNB and SPB. You’ll find updated information here.</p> +<p>In all, we expect that the LDBC organisation site engages all of you and that the future growth of RDF and Graph technologies is secured by the benchmarks we foster.</p> + + + + + 2nd International Workshop on Benchmarking RDF Systems + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + <p>Following the 1st International Workshop on Benchmarking RDF Systems (BeRSys 2013), the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industry practitioners can meet to discuss topics related to the performance of RDF systems. BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines - in the line of the TPCTC series of workshops. The focus of the workshop is to expose and initiate discussions on best practices, different application needs and scenarios related to different aspects of RDF data management.</p> +<p>More at: <a href="http://events.sti2.at/bersys2014/">http://events.sti2.at/bersys2014/</a></p> + + + + + DATAGEN: Data Generation for the Social Network Benchmark + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + <p>As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective of providing a realistic yet challenging workload, consisting of a social network and a set of queries. 
Both have to be realistic, easy to understand and easy to generate. This post has the objective of discussing the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 <a href="#references">[1]</a>.</p> +<p>One of the most important components of a benchmark is the dataset. However, directly using real data in a benchmark is not always possible. On the one hand, it is difficult to find data with all the scaling characteristics the benchmark requires. On the other hand, collecting real data can be expensive or simply not possible due to privacy concerns.</p> +<p>For these reasons, LDBC-SNB provides DATAGEN, which is the synthetic data generator responsible for generating the datasets for the three LDBC-SNB workloads: the Interactive, the Business Intelligence and the Analytical. DATAGEN has been carefully designed with the following goals in mind:</p> +<ul> +<li><strong>Realism.</strong> The data generated by DATAGEN has to mimic the features of the data found in a real social network. In DATAGEN, output attributes, cardinalities, correlations and distributions have been finely tuned to reproduce a real social network in each of its aspects. DATAGEN is aware of the data and link distributions found in a real social network such as Facebook <a href="#references">[2]</a>. Also, it uses real data from DBpedia, such as property dictionaries, which ensure that the content is realistic and correlated.</li> +<li><strong>Scalability.</strong> Since LDBC-SNB is targeting systems of different scales and budgets, DATAGEN must be capable of generating datasets of different sizes, from a few gigabytes to terabytes. DATAGEN is implemented following the MapReduce paradigm, allowing for the generation of large datasets on commodity clusters.</li> +<li><strong>Determinism.</strong> DATAGEN is deterministic regardless of the number of cores/machines used to produce the data. This important feature guarantees that all Test Sponsors will face the same dataset, thus making the comparisons between different systems fair and the benchmarks’ results reproducible.</li> +<li><strong>Usability.</strong> LDBC-SNB has been designed to have an affordable entry point. As such, DATAGEN has been strongly influenced by this philosophy, and therefore it has been designed to be as easy to use as possible.</li> +</ul> +<p>Finally, the area of action of DATAGEN is not only limited to the scope of LDBC-SNB. Several researchers and practitioners are already using DATAGEN in a wide variety of situations. If you are interested in the internals and possibilities of DATAGEN, please visit its official repository (<a href="https://github.com/ldbc/ldbc_snb_datagen">https://github.com/ldbc/ldbc_snb_datagen</a>).</p> +<h4 id="references">References</h4> +<p>[1] Pham, Minh-Duc, Peter Boncz, and Orri Erling. &ldquo;S3G2: A scalable structure-correlated social graph generator.&rdquo; Selected Topics in Performance Evaluation and Benchmarking. Springer Berlin Heidelberg, 2013. 156-172.</p> +<p>[2] Prat-Pérez, Arnau, and David Dominguez-Sal. &ldquo;How community-like is the structure of synthetically generated graphs?&rdquo; Proceedings of the Workshop on GRAph Data management Experiences and Systems. 
ACM, 2014.</p> + + + + + Getting Started With SNB + https://ldbcouncil.org/post/getting-started-with-snb/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-snb/ + <p>In a previous blog post titled &ldquo;<a href="https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/">Is SNB like Facebook&rsquo;s LinkBench?</a>&rdquo;, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.</p> +<h3 id="datagen">DATAGEN</h3> +<p>DATAGEN is the data generator used by all the workloads of SNB. <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/">Here</a> we introduced the design goals that drive the development of DATAGEN, which can be summarized as: <em>Realism, Scalability, Determinism and Usability.</em></p> +<p>DATAGEN produces datasets with the following schema, in terms of entities and their relations. The data generated represents a snapshot of the activity of a social network similar to real social networks such as Facebook during a period of time. Data includes entities such as Persons, Organizations, and Places. The schema also models the way persons interact, by means of the friendship relations established with other persons, and the sharing of content such as messages (both textual and images), replies to messages and likes to messages. People form groups to talk about specific topics, which are represented as tags.</p> +<p><img src="schema.png" alt="image"></p> +<p>For the sake of credibility, data produced by DATAGEN has to be realistic. In this sense, the data not only has a realistic schema, but also pays attention to the following items:</p> +<ul> +<li> +<p>Realistic distributions. The degree distribution of friendship relationships has been modeled to reproduce that found in the Facebook graph. Also, other distributions such as the number of replies to a post, the number of persons per country or the popularity of a tag have been realistically modeled, either using known distributions or data extracted from real sources such as DBpedia.</p> +</li> +<li> +<p>Correlated attributes and relations. Attribute values are not chosen at random, but follow correlations. For instance, people from a specific country have a larger probability to have names typical of that country, to work at companies from that country or to study at universities of that country. Also, DATAGEN implements a relationship creation process that tries to reproduce the homophily principle, that is, people with similar characteristics tend to be connected. A toy sketch of this idea is shown right after this list.</p> +</li> +</ul>
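+<p>The following is purely illustrative and is not DATAGEN code: a self-contained Java toy that biases a person&rsquo;s name and employer by their country, with made-up dictionaries and probabilities. DATAGEN itself draws its dictionaries from DBpedia and tunes its distributions against real data, but the correlation principle is the one sketched here:</p>
+<pre tabindex="0"><code>import java.util.ArrayList;
+import java.util.List;
+import java.util.Map;
+import java.util.Random;
+
+// Toy sketch of correlated attribute generation (not part of DATAGEN).
+public class CorrelatedPersonSketch {
+    static final Map&lt;String, List&lt;String&gt;&gt; NAMES = Map.of(
+            "Germany", List.of("Hans", "Anna", "Karl"),
+            "Spain",   List.of("Maria", "Jordi", "Lucia"));
+    static final Map&lt;String, List&lt;String&gt;&gt; COMPANIES = Map.of(
+            "Germany", List.of("Siemens", "SAP"),
+            "Spain",   List.of("Telefonica", "Iberia"));
+
+    public static void main(String[] args) {
+        Random rnd = new Random(42);                 // fixed seed keeps the output deterministic
+        List&lt;String&gt; countries = List.of("Germany", "Spain");
+        for (int i = 0; i &lt; 5; i++) {
+            String country = countries.get(rnd.nextInt(countries.size()));
+            // Mostly pick a name/employer typical of the country, rarely an uncorrelated one.
+            String name = pick(rnd, NAMES, country, 0.9);
+            String company = pick(rnd, COMPANIES, country, 0.8);
+            System.out.printf("Person %d: %s from %s, works at %s%n", i, name, country, company);
+        }
+    }
+
+    static String pick(Random rnd, Map&lt;String, List&lt;String&gt;&gt; dict, String country, double pCorrelated) {
+        if (rnd.nextDouble() &lt; pCorrelated) {
+            List&lt;String&gt; typical = dict.get(country);            // correlated choice
+            return typical.get(rnd.nextInt(typical.size()));
+        }
+        List&lt;String&gt; all = new ArrayList&lt;&gt;();
+        dict.values().forEach(all::addAll);                      // uncorrelated fallback
+        return all.get(rnd.nextInt(all.size()));
+    }
+}
+</code></pre>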
+<p>DATAGEN is built on top of Hadoop, to generate datasets of different sizes. It works either on single-node SMP machines or in a cluster environment. DATAGEN supports different output formats targeting different systems. On the one hand, we have the CSV format, where each entity and relation is output into a different comma-separated value file. On the other hand, it also supports the Turtle format for RDF systems.</p> +<p>Finally, DATAGEN outputs two other things:</p> +<ul> +<li> +<p>Update Streams, which will be used in the future to implement updates in the workloads.</p> +</li> +<li> +<p>Substitution parameters, which are the parameters of the query instances the LDBC driver will issue. These are selected so that the query plans of the resulting query executions do not differ significantly.</p> +</li> +</ul> +<p>Configuring and using DATAGEN is easy. Please visit <a href="https://github.com/ldbc/ldbc_snb_datagen">this page</a> for more information.</p> +<h3 id="ldbc-driver">LDBC driver</h3> +<p>SNB is designed to be as easy to adopt as possible. Therefore, SNB provides the LDBC execution driver, which is designed to automatically generate the benchmark workload and gather the benchmark results. It generates a stream of operations in conformance with a workload definition, and executes those operations against some system using the provided database connector, with the substitution parameters produced by DATAGEN. During execution, the driver continuously measures performance metrics, and upon completion it generates a report of those metrics.</p> +<p>It is capable of generating parallel workloads (e.g. concurrent reads and writes), while respecting the configured operation mix and ensuring that ordering between dependent operations is maintained. For further details on how the driver achieves that, please visit the Documentation <a href="https://github.com/ldbc/ldbc_driver/wiki">page</a>.</p> +<p>The test sponsor (i.e. the implementer of the benchmark) has to provide a set of implemented interfaces that form a benchmark implementation to plug into the driver, and then the benchmark is automatically executed.</p> +<p>Given a workload consisting of a series of <em>Operations</em>, the test sponsor implements <em>OperationHandlers</em> for them. <em>OperationHandlers</em> are responsible for executing instances of a specific operation (query) type. This is done by overriding the method <em>executeOperation</em>(), which receives an <em>Operation</em> instance as its input parameter and returns the result. From the <em>Operation</em> instance, the operation&rsquo;s input parameters can be retrieved, as well as the database connection state.</p> +<p>The database connector is used to initialize, clean up and get the database connection state. The database connector must implement the <em>Db</em> interface, which consists of three methods: <em>onInit</em>(), <em>onCleanup</em>() and <em>getConnectionState</em>(). <em>onInit</em>() is called before the benchmark is executed, and is responsible for initializing the database and registering the different <em>OperationHandlers</em>. <em>onCleanup</em>() is called after the benchmark has completed. Any resources that need to be released should be released here.</p> +<p>Finally, <em>getConnectionState</em>() returns an instance of <em>DbConnectionState</em>, which encapsulates any state that needs to be shared between <em>OperationHandler</em> instances. For instance, this state could contain the necessary classes used to execute a given query for the implementing system.</p> +<p>A good example of how to implement the benchmark can be found <a href="https://github.com/ldbc/ldbc_driver/wiki/Implementing%20a%20Database%20Connector">here</a>.</p>
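+<p>To make this contract concrete, the following self-contained Java sketch models the interfaces just described. It is illustrative only: the actual classes in the LDBC driver live in different packages and have richer signatures and result types, so please refer to the documentation linked above for the real API.</p>
+<pre tabindex="0"><code>import java.util.HashMap;
+import java.util.Map;
+
+// Simplified model of the connector contract described above (not the real driver API).
+interface DbConnectionState { void close(); }
+
+abstract class Db {
+    abstract void onInit(Map&lt;String, String&gt; properties) throws Exception; // called once before the run
+    abstract void onCleanup() throws Exception;                            // called once after the run
+    abstract DbConnectionState getConnectionState();                       // state shared by all handlers
+}
+
+abstract class OperationHandler&lt;O&gt; {
+    // Executes one instance of a specific operation (query) type.
+    abstract Object executeOperation(O operation, DbConnectionState state) throws Exception;
+}
+
+// A hypothetical test sponsor implementation backed by an in-memory "store".
+class MyConnectionState implements DbConnectionState {
+    final Map&lt;Long, String&gt; personNames = new HashMap&lt;&gt;(); // stands in for a real client/session
+    public void close() { personNames.clear(); }
+}
+
+class MyDb extends Db {
+    private MyConnectionState state;
+    void onInit(Map&lt;String, String&gt; properties) { state = new MyConnectionState(); }
+    void onCleanup() { state.close(); }
+    DbConnectionState getConnectionState() { return state; }
+}
+
+class PersonNameLookup {                                    // one operation type of the workload
+    final long personId;
+    PersonNameLookup(long personId) { this.personId = personId; }
+}
+
+class PersonNameLookupHandler extends OperationHandler&lt;PersonNameLookup&gt; {
+    Object executeOperation(PersonNameLookup op, DbConnectionState state) {
+        // Run the query against the shared connection state and return its result.
+        return ((MyConnectionState) state).personNames.get(op.personId);
+    }
+}
+</code></pre>
+<p>In this model, the driver would instantiate the connector, call <em>onInit</em>() before the run and <em>onCleanup</em>() after it, and route every generated operation to the handler registered for its type while measuring response times.</p>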
+<h3 id="workloads">Workloads</h3> +<p>Currently, LDBC has only released the first draft of the Interactive workload, but the business intelligence and analytical workloads are in the works. Workloads are designed to mimic the different usage scenarios found in operating a real social network site, and each of them targets one or more types of systems. Each workload defines a set of queries and query mixes, designed to stress the systems under test in different choke-point areas, while being credible and realistic.</p> +<p>The Interactive workload reproduces the interaction between the users of the social network by including lookups and transactions that update small portions of the database. These queries are designed to be interactive and target systems capable of responding to such queries with low latency for multiple concurrent users. Examples of Interactive queries are, given a user, retrieving those friends with a specific name, or finding the most recent posts and comments created by your friends.</p> +<p>The Business Intelligence workload will represent those business intelligence analytics a social network company would like to perform in the social network, in order to take advantage of the data to discover new business opportunities. This workload will explore moderate portions of data from different entities, and will perform more complex and data-intensive operations compared to the Interactive ones.</p> +<p>Examples of possible Business Intelligence queries could be finding trending topics in a country at a given moment, or looking for fraudulent “likers”.</p> +<p>Finally, the Analytical workload will aim at exploring the characteristics of the underlying structure of the network. Shortest paths, community detection or centrality are representative queries of this workload, and will imply touching a vast amount of the dataset.</p> +<h3 id="final-remarks">Final remarks</h3> +<p>This is just a quick overview of the SNB benchmark. For a more detailed description, do not hesitate to read the official SNB specification <a href="https://github.com/ldbc/ldbc_snb_docs">draft</a>, and stay tuned to the LDBC blog for future blog posts detailing all of the SNB parts in depth.</p> + + + + + Introducing SNB Interactive, the LDBC Social Network Benchmark Online Workload + https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/ + <p>The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads: interactive, business intelligence and graph analytics. This post introduces the interactive workload.</p> +<p>The benchmark measures the speed of queries of medium complexity against a social network being constantly updated. The queries are scoped to a user&rsquo;s social environment and potentially access data associated with the friends of a user and their friends.</p> +<p>This is representative of an operational application. This goes beyond OLTP (On Line Transaction Processing) by having substantially more complex queries touching much more data than the point lookups and short reports in TPC-C or E. The emphasis is on presenting a rich and timely view of a constantly changing environment.</p> +<p>SNB Interactive gives end users and application developers a reference workload for comparing the relative merits of different technologies for graph data management. These range from dedicated graph databases to RDF stores and relational databases. There are graph serving benchmarks such as the Facebook LinkBench, but SNB Interactive goes well beyond this in richness of schema and queries.</p> +<p>The challenge to implementors is handling the user-facing logic of a social network in a single system as the scale increases. 
The present practice in large social networks is massive sharding and use of different SQL and key-value stores for different aspects of the service. The SNB workload is not intended to replicate this situation but to look for ways forward, so that one system can keep up with transactions and offer users rich and varied insight into their environment. The present practice relies on massive precomputation, but SNB Interactive seeks more agility and ad hoc capability also on the operational side.</p> +<p>The dataset is scaled in buckets, with distinct scales for 10, 30, 100, 300GB and so forth. A 100GB dataset has approximately 500,000 simulated users with their connections and online history. This is a convenient low-end single-server size, while 500 million users is 100TB, which is a data center scale requiring significant scale-out.</p> +<p>The metric is operations per minute at scale. Online benchmarks typically have a fixed ratio between throughput and dataset size. Here we depart from this; thus, one can report arbitrarily high throughputs at any scale. This makes main memory approaches feasible, which corresponds to present online practices. The benchmark makes transactions and queries on a simulated timeline of social interactions. The challenge for the system is to run this as fast as possible at the selected scale while providing fast and predictable response times. Throughput can be increased at the cost of latency, but here the system must satisfy response time criteria while running at the reported throughput.</p> +<p>Different technologies can be used for implementing SNB Interactive. The workload is defined in natural language with sample implementations in SPARQL and Cypher. Other possibilities include SQL and graph database APIs.</p> +<p>SNB Interactive is an example of LDBC&rsquo;s choke point driven design methodology, where we draw on the combined knowledge and experience of several database system architects for defining realistic, yet ambitious challenges whose solution will advance the state of the art.</p> +<p>The benchmark specification and associated tools are now offered for public feedback. The LDBC partners working on SNB Interactive will provide sample implementations of the workload on their systems, including Virtuoso, Neo4J and Sparsity. Specifics of availability and coverage may vary.</p> +<p>Subsequent posts will address the workload in more detail.</p> + + + + + Is SNB Like Facebooks LinkBench + https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/ + <p>In this post, I will discuss in some detail the rationale and goals of the design of the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) and explain how it relates to real social network data as in Facebook, and in particular Facebook&rsquo;s own graph benchmark called <a href="https://www.facebook.com/notes/facebook-engineering/linkbench-a-database-benchmark-for-the-social-graph/10151391496443920">LinkBench</a>. We think SNB is the most intricate graph database benchmark to date (it&rsquo;s also available in RDF!), which has already made some waves. 
SNB recently received praise at the most important database systems conference <a href="http://www.sigmod2014.org/">SIGMOD in Snowbird</a> after being used for this year&rsquo;s <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD Programming Contest</a>, which was about graph analytics.</p> +<p>SNB is intended to provide the following <strong>value</strong> to different stakeholders:</p> +<ul> +<li> +<p>For end users facing graph processing tasks, SNB provides a recognizable scenario against which it is possible to <em>compare merits of different products</em> and technologies. By covering a wide variety of scales and price points, SNB can serve as an aid to technology selection.</p> +</li> +<li> +<p>For vendors of graph database technology, SNB provides a <em>checklist of features</em> and performance characteristics that helps in product positioning and can serve to guide new development.</p> +</li> +<li> +<p>For researchers, both industrial and academic, the SNB dataset and workload provide <em>interesting challenges</em> in multiple technical areas, such as query optimization, (distributed) graph analysis and transactional throughput, and provide a way to objectively compare the effectiveness and efficiency of new and existing technology in these areas.</p> +</li> +</ul> +<p>I should clarify that even though the data model of SNB resembles Facebook (and we&rsquo;re extending it to also look more like Twitter), the goal of SNB is not to advise Facebook or Twitter what systems to use; they don&rsquo;t need LDBC for that. Rather, we take social network data as a model for the much broader graph data management problems that IT practitioners face. The particular characteristic of a graph data management problem is that the queries and analysis are not just about finding data by value, but about learning about the <em>connection patterns</em> between data. The scenario of the SNB, a social network, was chosen with the following goals in mind:</p> +<ul> +<li> +<p>the benchmark scenario should be <strong>understandable</strong> to a large audience, and this audience should also understand the relevance of managing such data.</p> +</li> +<li> +<p>the scenario in the benchmark should cover the complete range of challenges <strong>relevant</strong> for graph data management, according to the benchmark scope.</p> +</li> +<li> +<p>the query challenges in it should be <strong>realistic</strong> in the sense that, though synthetic, similar data and workloads are encountered in practice.</p> +</li> +</ul> +<p>The SNB is in fact three distinct benchmarks with a common dataset, since there are <em>three different workloads</em>. Each workload produces a single metric for performance at the given scale and a price/performance metric at the scale. The full disclosure further breaks down the composition of the metric into its constituent parts, e.g. single query execution times.</p> +<ul> +<li> +<p><strong>Interactive Workload.</strong> The Interactive SNB workload is the first one we are releasing. It is defined in plain text, yet we have example implementations in Neo4j&rsquo;s Cypher, SPARQL and SQL. The interactive workload tests a system&rsquo;s throughput with relatively simple queries with concurrent updates. The system under test (SUT) is expected to run in a steady state, providing durable storage with smooth response times. Inserts are typically small, affecting a few nodes at a time, e.g. uploading of a post and its tags. Transactions may require serializability, e.g. 
verifying that something does not exist before committing the transaction. Reads do not typically require more than read committed isolation. One could call the Interactive Workload an OLTP workload, but while queries typically touch a small fraction of the database, this can still be up to hundreds of thousands of values (the two-step neighborhood of a person in the social graph, often). Note that in order to support the read queries, there is a lot of liberty to create indexing structures or materialized views; however, such structures need to be maintained with regard to the continuous inserts that are also part of the workload. This workload is now in draft stage, which means that the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a> and <a href="https://github.com/ldbc/ldbc_driver">driver software stack</a> are ready and the purpose is to obtain user feedback, as well as develop good system implementations. The first implementations of this workload are now running on Openlink Virtuoso, Neo4j and Sparsity Sparksee, and we are eager to see people try these, and to optimize and evolve them.</p> +</li> +<li> +<p><strong>Business Intelligence Workload.</strong> There is a first stab at this workload formulated in SPARQL, tested against Openlink Virtuoso. The BI workload consists of complex structured queries for analyzing online behavior of users for marketing purposes. The workload stresses query execution and optimization. Queries typically touch a large fraction of the data and do not require repeatable read. The queries will be concurrent with trickle load (not out yet). Unlike the interactive workload, the queries touch more data as the database grows.</p> +</li> +<li> +<p><strong>Graph Analytics Workload.</strong> This workload is not yet available. It will test the functionality and scalability of the SUT for graph analytics that typically cannot be expressed in a query language. As such it is the natural domain for graph programming frameworks like Giraph. The workload is still under development, but will consist of algorithms like PageRank, Clustering and Breadth First Search. The analytics is done on most of the data in the graph as a single operation. The analysis itself produces large intermediate results. The analysis is not expected to be transactional or to have isolation from possible concurrent updates.</p> +</li> +</ul> +<p>All the SNB scenarios share a common scalable synthetic data set, generated by a state-of-the-art <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a>. We strongly believe in a single dataset that makes sense for all workloads, that is, the interactive and BI workloads will traverse data that has sensible PageRank outcomes, and graph clustering structure, etc. This is in contrast to <a href="http://people.cs.uchicago.edu/~tga/pubs/sigmod-linkbench-2013.pdf">LinkBench</a>, released by the team of Facebook that manages the OLTP workload on the Facebook Graph, which closely tunes to the <strong>low-level</strong> MySQL query patterns Facebook sees, but whose graph structure does not attempt to be realistic beyond the average out-degree of the nodes (so it makes no attempt to create realistic community patterns or correlations). 
The authors of LinkBench may be right that the graph structure does not make a difference for the simple insert/update/delete/lookup actions which LinkBench itself tests, but for the SNB queries in the Interactive and BI workloads this is not true. Note that <a href="http://borthakur.com/ftp/sigmod2013.pdf">Facebook&rsquo;s IT infrastructure</a> does not store all user data in MySQL and its modified memcached (&quot;<a href="http://www.cs.cmu.edu/~pavlo/courses/fall2013/static/papers/11730-atc13-bronson.pdf">TAO</a>&quot;); some of it ends up in separate subsystems (using HDFS and HBase), which is outside of the scope of LinkBench. However, for queries like those in the SNB Interactive and BI workloads it <strong>does</strong> matter how people are connected, and how the attribute values of connected people correlate. In fact, the SNB data generator is unique in that it generates a huge graph with <em>correlations</em>, where people who live together, have the same interests or work for the same company have a greater chance to be connected, and people from Germany have mostly German names, etc. Correlations frequently occur in practice and can strongly influence the quality of query optimization and execution; therefore, LDBC wants to test their effects on graph data management systems (the impact of correlation among values and structure on query optimization and execution is a &ldquo;choke point&rdquo; for graph data management systems where LDBC wants to stimulate innovation).</p> + + + + + Making It Interactive + https://ldbcouncil.org/post/making-it-interactive/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-it-interactive/ + <p><em>Synopsis:</em> Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must be both credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation for what online systems in fact do. So, the workload mix must strike a balance between practice and presenting new challenges.</p> +<p>It is about to be showtime for LDBC. The initial installment of the LDBC Social Network Benchmark (SNB) is the full data generator, test driver, workload and reference implementation for the interactive workload. SNB will further acquire business intelligence and graph analytics workloads, but this post is about the interactive workload.</p> +<p>As part of finalizing the interactive workload, we need to determine precise mixes of the component queries and updates. We note that the interactive mix so far consists of very heavy queries. These touch, depending on the scale, upwards of a million entities in the database.</p> +<p>Now, rendering a page view in a social network site does not touch millions of entities. The query that needs to be correct and up to date touches tens or hundreds of entities, e.g. posts or social connections for a single page impression. 
There are also statistical views like the count of people within so many steps or contact recommendations, but these are not real time and are not recalculated each time they are shown.</p>
+<p>So, LDBC SNB has a twofold task:</p>
+<ol>
+<li>In order to be a credible interactive workload, it must in fact have the characteristics of one.</li>
+<li>In order to stimulate progress it must have queries that are harder than those that go in routine page views but are still not database-wide analytics.</li>
+</ol>
+<p>Designing a workload presents specific challenges:</p>
+<ol>
+<li>The workload must be realistic enough for users to identify with it.</li>
+<li>The workload must pose challenges and drive innovation in a useful direction.</li>
+<li>The component operations must all play a noticeable role in it. If the operation&rsquo;s relative performance does not affect the score, why is it in the workload?</li>
+</ol>
+<p>The interactive mix now has 14 queries that are interesting from a query optimization and execution viewpoint but touch millions of entities. This is not what drives page impressions in online sites. Many users of graph databases and RDF run online sites, so this aspect must not be ignored.</p>
+<p>Very roughly, the choke points (technical challenges) of SNB interactive are as follows:</p>
+<ul>
+<li>Random access - Traversing between people and content makes large numbers of random lookups. These can be variously parallelized and/or vectored.</li>
+<li>Query optimization must produce the right plans - The primary point is join order and join type. Index vs. hash based joins have very different performance properties and the right choice depends on correctly guessing the number of rows and of distinct keys on either side of the join.</li>
+<li>When doing updates and lookups, the execution plan is obvious but there the choke point is the scheduling of large numbers of short operations.</li>
+<li>Many queries have aggregation, many have distinct, all have result ordering and a limit on result count. The diverse interactions of these operators produce optimization opportunities.</li>
+</ul>
+<p>Dreaming up a scenario and workload is not enough for a benchmark. There must also be a strong indication that the job is do-able and plausible in the scenario.</p>
+<p>In online benchmarks different operations have different frequencies and the operations are repeated large numbers of times. There is a notion of steady state, so that the reported result represents a level of performance a system can sustain indefinitely.</p>
+<p>A key part of the workload definition is the workload mix, i.e. the relative frequencies of the operations. This decides in fact what the benchmark measures.</p>
+<p>The other aspect is the metric, typically some variation on operations per unit of time.</p>
+<p>All these are interrelated. Here we can take clicks per second as a metric, which is easy to understand. We wish to avoid the pitfall of TPC-C, which ties the metric to a data size, so that for a high metric one must have a correspondingly larger database. This rule makes memory-only implementations in practice unworkable, while in reality many online systems in fact run from memory. So, here we scale in buckets, like in TPC-H, but we still have an online workload. The scenario of the benchmark has its own timeline, here called simulation time. A benchmark run produces events in the simulation time but takes place in real time. This defines an acceleration ratio.
For example, we could say that a system does 1000 operations per second at 300G scale, with an acceleration of 7x, i.e. 7 hours&rsquo; worth of simulation time are done in one hour of real time. A metric of this form is directly understandable for sizing a system, as long as the workload mix is realistic. We note that online sites usually are provisioned so that servers do not run anywhere near their peak throughput at a busy time.</p>
+<p>So how to define the actual mix? By measuring. But measuring requires a reference implementation that is generally up to date for the database science of the time and where the individual workload pieces are implemented in a reasonable manner, so no bad query plans or bad schema design. For the reference implementation, we use the Virtuoso column store in SQL.</p>
+<p>But SQL is not graphy! Why not SPARQL? Because SPARQL has diverse fixed overheads and this is not an RDF-only workload. We do not want SPARQL overheads to bias the metric; we just want an implementation where we know exactly what goes on and how it works, with control of physical data placement, so we know there are no obvious stupidities in any of this. SPARQL will come. Anyway, as said elsewhere, we believe that SPARQL will outgrow its overheads, at which point SQL or SPARQL is a matter of esthetic preference. For now, it is SQL and all we want is transparency into the metal.</p>
+<p>Having this, we peg the operation mix to the update stream generated by the data generator. At the 30G scale, there are 3.5M new posts/replies per month of simulation time. For each such post, a query mix will be run, so as to establish a realistic read/write ratio. The query mix will have fractional queries, for example 0.2 friends recommendations per new post, but that is not a problem, since we run large numbers of these and at the end of the run can check that the ratios of counts are as expected. Next, we run this as fast as it will go on the test system. Then we adjust the ratio of short and long queries to meet two objectives:</p>
+<ul>
+<li>Short queries should collectively be about 45% of the CPU load.</li>
+<li>Updates will be under 5%.</li>
+<li>Long queries will take up the rest. For long queries, we further tune the relative frequencies so that each represents a roughly equal slice of the time. Having a query that does not influence the metric is useless, so each gets enough showtime to have an impact, but by their nature some are longer than others.</li>
+</ul>
+<p>The reason why short queries should have a large slice is the fact that this is so in real interactive systems. The reason why long queries are important is driving innovation. Like this we get both scheduling (short lookup/update) and optimization choke points covered. As a bonus, we make the mix so that we get a high metric, i.e. many clicks per second, since this is what the operator of an online site wants.</p>
+<p>There is a further catch: different scales have different degrees in the friends graph and this will have a different influence on different queries. To see whether this twists the metric out of shape we must experiment. For example, one must not have logarithmic and linear complexity queries in the same mix, as BSBM for example has. So this is to be kept in mind as we proceed.</p>
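+<p>To make the arithmetic above concrete, here is a back-of-the-envelope sketch (ours, not part of the benchmark tooling) that recomputes the acceleration ratio from the figures quoted in this post: 3.5M new posts/replies per month of simulation time, and a hypothetical measured throughput of 9.5 executed post-mixes per second of real time.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"># Back-of-the-envelope acceleration-ratio check (illustrative numbers only).
+POSTS_PER_SIM_MONTH=3500000    # the SF30 figure quoted in the text
+MEASURED_MIXES_PER_SEC=9.5     # hypothetical throughput measured on the SUT
+
+awk -v posts="$POSTS_PER_SIM_MONTH" -v tput="$MEASURED_MIXES_PER_SEC" 'BEGIN {
+  sim_rate = posts / (30 * 24 * 3600)  # new posts per simulation second
+  accel    = tput / sim_rate           # simulation seconds per real second
+  printf "simulation rate: %.2f posts/sim-second\n", sim_rate
+  printf "acceleration   : %.1fx\n", accel
+}'
+</code></pre></div>
+<p>With these made-up numbers the run covers roughly 7 hours of simulation time per hour of real time, matching the 7x example above.</p>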
+<p>In the next post we will look at the actual mix and execution times on the test system.</p>
+
+
+
+
+ SNB Data Generator - Getting Started
+ https://ldbcouncil.org/post/snb-data-generator-getting-started/
+ Thu, 09 Oct 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/snb-data-generator-getting-started/
+ <p>In previous posts (<a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">this</a> and <a href="https://ldbcouncil.org/post/getting-started-with-snb">this</a>) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datasets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.</p>
+<h3 id="getting-and-configuring-hadoop">Getting and Configuring Hadoop</h3>
+<p>DATAGEN runs on top of Hadoop 1.2.1 in order to scale. You can download it from here. Open a console and type the following commands to decompress Hadoop into the /home/user folder:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user
+</span></span><span style="display:flex;"><span>$ tar xvfz hadoop-1.2.1.tar.gz
+</span></span></code></pre></div><p>For simplicity, in this tutorial we will run DATAGEN in standalone mode, that is, only one machine will be used, using only one thread at a time to run the mappers and reducers. This is the default configuration, so nothing else needs to be done to configure it. For other configurations, such as Pseudo-Distributed (multiple threads on a single node) or Distributed (a cluster of machines), visit the <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/wiki/Configuration">LDBC DATAGEN wiki</a>.</p>
+<h3 id="getting-and-configuring-datagen">Getting and configuring DATAGEN</h3>
+<p>Before downloading DATAGEN, be sure to fulfill the following requirements:</p>
+<ul>
+<li>Linux based machine</li>
+<li>java 1.6 or greater</li>
+<li>python 2.7.X</li>
+<li>maven 3</li>
+</ul>
+<p>After configuring Hadoop, it is time to get DATAGEN from the LDBC-SNB official repositories. Always download the latest release, which at this time is v0.1.2. The releases page can be found <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/releases">here</a>. Again, decompress the downloaded file with the following commands:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user
+</span></span><span style="display:flex;"><span>$ tar xvfz ldbc_snb_datagen-0.1.2.tar.gz
+</span></span></code></pre></div><p>This will create a folder called “ldbc_snb_datagen-0.1.2”.</p>
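+<p>Before wiring up <em>run.sh</em> in the next step, it can be worth sanity-checking the prerequisites listed above and the Hadoop unpack. This is only an optional sketch, assuming the paths used in this tutorial:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"># Check that the required tools are on the PATH and report their versions.
+java -version       # expects Java 1.6 or greater
+python --version    # expects Python 2.7.x
+mvn -version        # expects Maven 3
+
+# Verify that the Hadoop 1.2.1 unpack is usable in standalone mode.
+/home/user/hadoop-1.2.1/bin/hadoop version
+</code></pre></div>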
+<p>DATAGEN provides <em>run.sh</em>, a script to automate the compilation and execution of DATAGEN. It needs to be configured for your environment, so open it and set the two variables at the top of the script to the corresponding paths.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>HADOOP_HOME<span style="color:#f92672">=</span>/home/user/hadoop-1.2.1
+</span></span><span style="display:flex;"><span>LDBC_SNB_DATAGEN_HOME<span style="color:#f92672">=</span>/home/user/ldbc_snb_datagen
+</span></span></code></pre></div><p>HADOOP_HOME points to the path where hadoop-1.2.1 is installed, while LDBC_SNB_DATAGEN_HOME points to where DATAGEN is installed. Change these variables to the appropriate values. Now, we can execute the <em>run.sh</em> script to compile and execute DATAGEN using default parameters. Type the following commands:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user/ldbc_snb_datagen-0.1.2
+</span></span><span style="display:flex;"><span>$ ./run.sh
+</span></span></code></pre></div><p>This will run DATAGEN, and two folders will be created in the same directory: <em>social_network</em>, containing the scale factor 1 dataset as uncompressed CSV files, and <em>substitution_parameters</em>, containing the substitution parameters needed by the driver to execute the benchmark.</p>
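+<p>A quick way to confirm that the run produced what you expect is to inspect the two output folders. The snippet below is only an illustration; the exact file names depend on the DATAGEN version and the chosen serializer.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"># List the generated entity files and get a rough size estimate.
+ls social_network | head
+wc -l social_network/*.csv | tail -n 1   # total number of CSV rows
+
+# The substitution parameters are plain text files, one per query type.
+ls substitution_parameters | head
+</code></pre></div>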
+<h3 id="changing-the-generated-dataset">Changing the generated dataset</h3>
+<p>The characteristics of the dataset to be generated are specified in the <em>params.ini</em> file. By default, this file has the following content:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:1</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:1</span>
+</span></span></code></pre></div><p>The following is the list of options and their default values supported by DATAGEN:</p>
+<table>
+<thead>
+<tr>
+<th>Option</th>
+<th>Default value</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>scaleFactor</td>
+<td>1</td>
+<td>The scale factor of the data to generate. Possible values are: 1, 3, 10, 30, 100, 300 and 1000</td>
+</tr>
+<tr>
+<td>serializer</td>
+<td>csv</td>
+<td>The format of the output data. Options are: csv, csv_merge_foreign, ttl</td>
+</tr>
+<tr>
+<td>compressed</td>
+<td>FALSE</td>
+<td>Specifies whether to compress the output data with gzip.</td>
+</tr>
+<tr>
+<td>outputDir</td>
+<td>./</td>
+<td>Specifies the folder to output the data to.</td>
+</tr>
+<tr>
+<td>updateStreams</td>
+<td>FALSE</td>
+<td>Specifies whether to generate the update streams of the network. If set to false, the update portion of the network is output as static.</td>
+</tr>
+<tr>
+<td>numThreads</td>
+<td>1</td>
+<td>Sets the number of threads to use. Only works for pseudo-distributed mode.</td>
+</tr>
+</tbody>
+</table>
+<p>For instance, a possible <em>params.ini</em> file could be the following:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:30</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:ttl</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:true</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:false</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span>
+</span></span></code></pre></div><p>For those interested in generating a dataset not for one of the predefined scale factors but for other applications, the following parameters can be specified instead (they need to be specified all together):</p>
+<table>
+<thead>
+<tr>
+<th>Option</th>
+<th>Default value</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>numPersons</td>
+<td>-</td>
+<td>The number of persons to generate</td>
+</tr>
+<tr>
+<td>numYears</td>
+<td>-</td>
+<td>The number of years of activity</td>
+</tr>
+<tr>
+<td>startYear</td>
+<td>-</td>
+<td>The start year of the simulation.</td>
+</tr>
+</tbody>
+</table>
+<p>The following is an example of another possible <em>params.ini</em> file:</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">numPersons:100000</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numYears:3</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">startYear:2010</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv_merge_foreign</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:true</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span>
+</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span>
+</span></span></code></pre></div><p>For more information about the schema of the generated data, the different scale factors and serializers, please visit the wiki page of DATAGEN at <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/">GitHub</a>!</p>
+
+
+
+
+ The Day of Graph Analytics
+ https://ldbcouncil.org/post/the-day-of-graph-analytics/
+ Thu, 09 Oct 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/the-day-of-graph-analytics/
+ <p><em>Note: consider this post as a continuation of the &ldquo;<a href="https://ldbcouncil.org/post/making-it-interactive">Making it interactive</a>&rdquo; post by Orri Erling.</em></p>
+<p>I have now completed the <a href="https://github.com/openlink/virtuoso-opensource">Virtuoso</a> TPC-H work, including scale out. Optimization possibilities extend to infinity but the present level is good enough.
<a href="http://www.tpc.org/tpch/">TPC-H</a> is the classic of all analytics benchmarks and is difficult enough, I have extensive commentary on this on my blog (In Hoc Signo Vinces series), including experimental results. This is, as it were, the cornerstone of the true science. This is however not the totality of it. From the LDBC angle, we might liken this to the last camp before attempting a mountain peak.</p> +<p>So, we may now seriously turn to graph analytics. The project has enough left to run in order to get a good BI and graph analytics workload. In LDBC in general, as in the following, BI or business intelligence means complex analytical queries. Graph analytics means graph algorithms that are typically done in graph programming frameworks or libraries.</p> +<p>The BI part is like TPC-H, except for adding the following challenges:</p> +<ul> +<li> +<p>Joins of derived tables with group by, e.g. comparing popularity of items on consecutive time periods.</p> +</li> +<li> +<p>Transitive dimensions - A geographical or tag hierarchy can be seen as a dimension table. To get the star schema plan with the selective hash join, the count of the transitive traversal of the hierarchy (hash build side) must be correctly guessed.</p> +</li> +<li> +<p>Transitivity in fact table, i.e. average length of reply thread. There the cost model must figure that the reply link is much too high cardinality for hash build side, besides a transitive operation is not a good candidate for a build in multiple passes, hence the plan will have to be by index.</p> +</li> +<li> +<p>Graph traversal with condition on end point and navigation step. The hierarchical dimensions and reply threads are in fact trees, the social graph is not. Again the system must know some properties of connectedness (in/out degree, count of vertices) to guess a traversal fanout. This dictates the join type in the step (hash or index). An example is a transitive closure with steps satisfying a condition, e.g. all connected persons have a specific clearance.</p> +</li> +<li> +<p>Running one query with parameters from different buckets, implying different best plan.</p> +</li> +<li> +<p>Data correlations, e.g. high selectivity arising from two interests seldom occurring together, in places where the correct estimation makes the difference between a good and a bad plan.</p> +</li> +<li> +<p>Large intermediate results stored in tables, as in materializing complex summaries of data for use in follow up queries.</p> +</li> +<li> +<p>More unions and outer joins.</p> +</li> +</ul> +<p>The idea is to cover the base competences the world has come to expect and to build in challenges to last another 10-15 years.</p> +<p>For rules and metric, we can use the TPC-H or <a href="http://www.tpc.org/tpcds/default.asp">TPC-DS</a> ones as a template. The schema may differ from an implementation of the interactive workload, as these things would normally run on different systems anyway. As another activity that is not directly LDBC, I will do a merge of SNB and <a href="http://www.openstreetmap.org/">Open Street Map</a>. The geolocated things (persons, posts) will get real coordinates from their vicinity and diverse geo analytics will become possible. This is of some significant interest to Geoknow, another FP7 where OpenLink is participating.</p> +<p>Doing the BI mix and even optimizing the interactive part involves some redoing of the present support for transitivity in Virtuoso. 
The partitioned group by with some custom aggregates is the right tool for the job, with all parallelization, scale-out, etc. ready. You see, TPC-H is very useful also in places one does not immediately associate with it.</p>
+<p>As a matter of fact, this becomes a BSP (bulk synchronous processing) control structure. Run any number of steps; in each step, every item produces results/effects scattered across partitions. The output of the previous step is the input of the next. We might say BSP is an attractor or &ldquo;Platonic&rdquo; control structure to which certain paths inevitably lead. Last year I did a BSP implementation in SQL, reading and writing tables and using transactions for serializable update of the border. This is possible but will not compete with a memory-based framework, and not enough of the optimization potential, e.g. message combining, is visible to the engine in this formulation. So, now we will get this right, as suggested.</p>
+<p>So, the transitive derived table construct can have pluggable aggregations (e.g. remembering a path, a minimum length or such), reduction like a scalar-valued aggregate (min/max), different grouping sets like in a group by with cube or grouping sets, some group-by-like reduction for message combining and so forth. If there is a gather phase that is not just the result of the scatter of the previous step, this can be expressed as an arbitrary database query, also cross-partition in a scale-out setting.</p>
+<p>The distributed/partitioned group by hash table will be a first class citizen, like a procedure-scoped temporary table, to facilitate returning multiple results and passing large data between multiple steps with different vertex operations, e.g. forward and backward in betweenness centrality.</p>
+<p>This brings us to the graph analytics proper, which is often done in BSP style, e.g. <a href="http://es.slideshare.net/shatteredNirvana/pregel-a-system-for-largescale-graph-processing">Pregel</a>, <a href="http://giraph.apache.org">Giraph</a>, <a href="http://uzh.github.io/signal-collect/">Signal-Collect</a>, some but not all <a href="http://ppl.stanford.edu/main/green_marl.html">Green-Marl</a> applications. In fact, a Green-Marl back end for Virtuoso is conceivable; whether one will be made is a different matter.</p>
+<p>With BSP in the database engine, a reference implementation of many standard algorithms is readily feasible and performant enough to do reasonable sizing for the workload and to have a metric. This could be edges or vertices per unit of time, across a mix of algorithms, for example. Some experimentation will be needed. The algorithms themselves may be had from the Green-Marl sample programs or other implementations. Among others, Oracle would presumably agree that this sort of functionality will in time migrate into the core database. We will here have a go at this and along the way formulate some benchmark tasks for a graph analytics workload. Whenever feasible, this will derive from existing work such as <a href="http://graphbench.org/">graphbench.org</a> but will be adapted to the SNB dataset.</p>
+<p>The analytics part will be done with more community outreach than the interactive one. I will blog about the business questions, queries and choke points as we go through them.
The interested may pitch in as the matter comes up.</p>
+
+
+
+
+ Using LDBC SPB to Find OWLIM Performance Issues
+ https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/
+ Wed, 20 Aug 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/
+ <p>During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (LDBC-SPB) as a part of our development and release process.</p>
+<p>The first thing we’ve started using the LDBC-SPB for is to monitor the performance of our RDF Store when a new release is about to come out.</p>
+<p>Initially we’ve decided to fix some of the benchmark parameters:</p>
+<ul>
+<li>the dataset size - 50 million triples (LDBC-SPB50)</li>
+<li>benchmark warmup and benchmark run times - 60s and 600s respectively</li>
+<li>maximum number of Editorial Agents (E): 2 (threads that will execute INSERT/UPDATE operations)</li>
+<li>maximum number of Aggregation Agents (A): 16 (threads that will execute SELECT operations)</li>
+<li>data generated by the benchmark driver to be “freshly” deployed before each benchmark run - the benchmark driver can be configured to generate the data and stop. We’re using that option and have a fresh copy of the data put aside, ready for each run.</li>
+</ul>
+<p>Having those parameters fixed, running LDBC-SPB is a straightforward task. The hardware we’re using for benchmarking is a machine with 2 Intel Xeon CPUs, 8 cores each, 256 GB of memory and SSD storage, running Linux. Another piece of hardware we’ve tested with is a regular desktop machine with an Intel i7, 32 GB of memory and HDD storage. During our experiments we have allowed a deviation in results of 5% to 10% because of the multi-threaded nature of the benchmark driver.</p>
+<p>We’ve also decided to produce some benchmark results on Amazon’s EC2 instances and compare them with the results we’ve had so far. Starting with an m3.2xlarge instance (8 vCPUs, 30GB of memory and 2x80GB SSD storage) on a 50M dataset, we’ve achieved more than 50% lower results than the ones on our own hardware. On a larger Amazon instance, c3.4xlarge (16 vCPUs, 30GB of memory and doubled SSD storage), we’ve achieved the same performance in terms of aggregation operations and even worse performance in terms of editorial operations, which we attribute to the fact that Amazon instances are not providing consistent performance all the time.</p>
+<p>The following two charts show how OWLIM performs on different hardware and with different configurations. They also give an indication of Amazon’s capabilities compared to the results achieved on bare-metal hardware.</p>
+<p><img src="16-2-Performance.png" alt="image"></p>
+<p>Figure 1: OWLIM performance: 2 Amazon instances and 2 local machines. 16 aggregation and 2 editorial agents running simultaneously. Aggregation and editorial operations displayed here should be considered independently, i.e. even though the editorial operations graph shows higher results on the Amazon m3.2xlarge instance, values are normalized and refer to the corresponding type of operation.</p>
+<p><img src="8-0-Performance.png" alt="image"></p>
+<p>Figure 2: OWLIM performance: 2 Amazon instances and 2 local machines. 8 aggregation agents running simultaneously. Read-only mode.</p>
+<p>Another thing that we’re using LDBC-SPB for is to monitor load performance. Loading of generated data can be done either manually, by creating some sort of a script (curl), or by the benchmark driver itself, which will execute a standard POST request against a provided SPARQL endpoint. The benchmark’s data generator can be configured to produce chunks of generated data in various sizes, which can be used for experiments on load performance. Of course, load times of forward-chaining reasoners cannot be compared to those of backward-chaining ones, which is not the goal of the benchmark. Loading performance is not measured “officially” by LDBC-SPB (although the time for loading the data is reported), but it is a good thing to have when comparing RDF stores.</p>
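+<p>As an illustration of the manual (curl) route mentioned above, a chunk of generated data can be posted to the store and timed in one go. This is only a sketch: the endpoint URL, graph URI, file name and content type below are placeholders and differ per RDF store and data format.</p>
+<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"># Load one generated chunk over HTTP and report how long the request took.
+# Endpoint, graph URI and file name are hypothetical examples.
+curl --silent --show-error -o /dev/null \
+     -X POST \
+     -H "Content-Type: text/turtle" \
+     --data-binary @generated-chunk-0001.ttl \
+     -w "loaded in %{time_total}s\n" \
+     "http://localhost:8080/repositories/spb/rdf-graphs/service?graph=http%3A%2F%2Fexample.org%2Fspb"
+</code></pre></div>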
+<p>An additional and interesting feature of the SPB is the test for conformance to the OWL2-RL rule-set. It is a part of the LDBC-SPB benchmark and that phase is called <em>checkConformance</em>. The phase is run independently of the benchmark phase itself. It requires no data generation or loading except for the initial set of ontologies. It tests the RDF store’s capabilities for conformance to the rules in the OWL2-RL rule-set by executing a number of INSERT/ASK queries specific to each rule. The result of that phase is a list of all rules that have been passed or failed, which is very useful for regression testing.</p>
+
+
+
+
+ Fourth TUC meeting
+ https://ldbcouncil.org/event/fourth-tuc-meeting/
+ Thu, 03 Apr 2014 12:32:22 -0400
+
+ https://ldbcouncil.org/event/fourth-tuc-meeting/
+ <p>The LDBC consortium are pleased to announce the fourth Technical User Community (TUC) meeting.</p>
+<p>This will be a one-day event at CWI in Amsterdam on <em>Thursday April 3, 2014</em>.</p>
+<p>The event will include:</p>
+<ul>
+<li>Introduction to the objectives and progress of the LDBC project.</li>
+<li>Description of the progress of the benchmarks being evolved through Task Forces.</li>
+<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li>
+<li>Industry discussions on the contents of the benchmarks.</li>
+</ul>
+<p>All users of RDF and graph databases are welcome to attend.
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<p><strong>For presenters please limit your talks to just 15 minutes</strong></p> +<h3 id="agenda">Agenda</h3> +<p><strong>April 3rd</strong></p> +<ul> +<li> +<p>10:00 Peter Boncz (VUA) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506371.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=JYWVgrP1kVY">video</a>: <em>LDBC project status update</em></p> +</li> +<li> +<p>10:20 Norbert Martinez (UPC) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506375.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=4yREJQ3yDr0">video</a>: <em>Status update on the LDBC Social Network Benchmark (SNB) task force</em>.</p> +</li> +<li> +<p>10:50 Alexandru Iosup (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506363.ppt">ppt</a>, <a href="https://www.youtube.com/watch?v=ulT-RFwKpOE">video</a>: <em>Towards Benchmarking Graph-Processing Platforms</em></p> +</li> +<li> +<p>11:10 Mike Bryant (Kings College) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506364.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=KiHRTu9xx0A">video</a>: <em>EHRI Project: Archival Integration with Neo4j</em></p> +</li> +</ul> +<p><strong>11:30 coffee</strong></p> +<ul> +<li> +<p>11:50 Thilo Muth (University of Magdeburg) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506369.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=5xH3UDLP6Oc">video</a>: <em>MetaProteomeAnalyzer: a graph database backed software for functional and taxonomic protein data analysis</em></p> +</li> +<li> +<p>12:10 Davy Suvee (Janssen Pharmaceutica / Johnson &amp; Johnson) – <a href="https://www.youtube.com/watch?v=XN3LRJUfJIU">video</a>: <em>Euretos Brain - Experiences on using a graph database to analyse data stored as a scientific knowledge graph</em></p> +</li> +<li> +<p>12:30 Yongming Luo (TU Eindhoven) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506366.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=g_my3tBB2_s">video</a>: <em>Regularities and dynamics in bisimulation reductions of big graphs</em></p> +</li> +<li> +<p>12:50 Christopher Davis (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506370.pdf">pdf</a>, <a href="https://www.youtube.com/channel/UC6HbzfJ4016Vez-2HKNeDag">video</a>: <em>Enipedia - Enipedia is an active exploration into the applications of wikis and the semantic web for energy and industry issues</em></p> +</li> +</ul> +<p><strong>13:10 - 14:30 lunch @ restaurant Polder</strong></p> +<ul> +<li> +<p>14:30 <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506365.pptx">SPB task force report</a></p> +</li> +<li> +<p>15:00 Bastiaan Bijl (Sysunite) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506373.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=TsCeKDHShMY">video</a>: <em>Using a semantic approach for monitoring applications in large engineering projects</em></p> +</li> +<li> +<p>15:20 Frans Knibbe (Geodan) – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506372.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=uAX-m4OewPM">video</a>: <em>Benchmarks for geographical data</em></p> +</li> +<li> +<p>15:40 Armando Stellato (University of Rome, Tor Vergata &amp; UN Food and Agriculture Organization) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506374.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=mfA4csAs72Y">video</a>: <em>VocBench2.0, a Collaborative Environment for SKOS/SKOS-XL Management: scalability and (inter)operatibility challenges</em></p> +</li> +</ul> +<p><strong>16:00 coffee</strong></p> +<ul> +<li> +<p>16:20 Ralph Hodgson (TopQuadrant) – [pdf](https://pu b-3834 10a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachment s/5538064/5506367.pdf), <a href="https://www.youtube.com/watch?v=ZUDnVw9P_Rc">video</a>:<em>Customer experiences in implementing SKOS-based vocabularymanagement systems</em></p> +</li> +<li> +<p>16:40 Simon Jupp (European Bioinformatics Institute) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506368.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=CgTuOGK92W8">video</a>: <em>[Delivering RDF for the life science at the European Bioinformatics Institute: Six months in.]</em></p> +</li> +<li> +<p>17:00 Jerven Bolleman (Swiss Institute of Bioinformatics) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506381.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=QTc3yOgoEsg">video</a>: <em>Breakmarking UniProt RDF. SPARQL queries that make your database cry&hellip;</em></p> +</li> +<li> +<p>17:20 Rein van &rsquo;t Veer (Digital Heritage Netherlands) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506380.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=2vDrZoskGyQ">video</a> <em>Time and space for heritage</em></p> +</li> +<li> +<p>17:40 <strong>end of meeting</strong></p> +</li> +<li> +<p>19:00 - 21:30 Social Dinner in restaurant Boom</p> +</li> +</ul> +<p><strong>April 4th</strong></p> +<p>LDBC plenary meeting for project partners.</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506362.ppt">Benchmarking Graph-Processing Platforms: A Vision</a> – Alexandru Iosup</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p>The meeting will be held at the Dutch national research institute for computer science and mathematics (<a href="http://www.cwi.nl">CWI</a> - Centrum voor Wiskunde en Informatica). 
It is located at <a href="http://www.amsterdamsciencepark.nl/">Amsterdam Science Park</a>:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505821.jpg" alt=""></p> +<p>(<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505820.pdf">A5 map</a>)</p> +<h6 id="travel">Travel</h6> +<p><strong>Arriving &amp; departing:</strong></p> +<p>Amsterdam has a well-functioning and nearby airport called Schiphol (AMS, <a href="http://www.schiphol.com/">www.schiphol.nl</a>) that serves all main European carriers and also very many low-fare carriers.</p> +<p><a href="http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane">http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane</a></p> +<p><strong>Trains</strong> (~5 per hour) are the most convenient means of transport between Schiphol airport and Amsterdam city center, the Centraal Station (17 minutes, a train every 15 minutes) &ndash; which station you are also likely arriving at in case of an international train trip.</p> +<p>From the Centraal Station in Amsterdam, there is a direct train (every half an hour, runs 11 minutes) to the Science Park station, which is walking distance of CWI. If you go from the Centraal Station to one of the hotels, you should take tram 9 &ndash; it starts at Centraal Station (exception: for Hotel Casa 400, you should take the metro to Amstel station - any of the metros will do).</p> +<p><strong>Taxi</strong> is an alternative, though expensive. The price from Schiphol will be around 45 EUR to the CWI or another point in the city center (depending on traffic, the ride is 20-30 minutes).</p> +<p><strong>Public transportation</strong> (tram, bus, metro) tickets for a single ride and 1-day (24 hour) passes can be purchased from the driver/conductor on trams and buses (cash only) and from vending machines in the metro stations.</p> +<p><strong>Only the &ldquo;disposable&rdquo; cards are interesting for you as visitor.</strong></p> +<p>Multi-day (up to 7-days/168 hours) passes can only be purchased from the vending machines or from the ticket office opposite of Centraal Station.</p> +<p><strong>Getting Around:</strong> the fastest way to move in the city of Amsterdam generally is by bicycle. Consider renting such a device at your hotel. For getting from your hotel to the CWI, you can either take a taxi (expensive), have a long walk (35min), use public transportation (for NH Tropen/The Manor take bus 40 from Muiderpoort Station, for Hotel Casa 400 same bus 40 but from Amstel station, and for the Rembrandt Hotel it is tram 9 until Middenweg/Kruislaan and then bus 40), or indeed bike for 12 minutes.</p> +<p><strong>Cars</strong></p> +<p>In case you plan to arrive by car, please be aware that parking space in Amsterdam is scarce and hence very expensive. But, you can park your car on the &ldquo;WCW&rdquo; terrain where CWI is located. To enter the terrain by car, you have to get a ticket from the machine at the gate. To leave the terrain, again, you can get an exit ticket from the CWI reception.</p> +<p><strong>Arriving at CWI:</strong> Once you arrive at CWI, you need to meet the reception, and tell them that you are attending the LDBC TUC meeting. 
Then, you&rsquo;ll receive a visitor&rsquo;s pass that allows you to enter our building.</p> +<p><strong>Social Dinner</strong></p> +<p>The social dinner will take place at 7pm on April 3 in Restaurant Boom (<a href="http://www.boometenendrinken.nl/">boometenendrinken.nl</a>), Linneausstraat 63, Amsterdam.</p> + + + + + Third TUC Meeting + https://ldbcouncil.org/event/third-tuc-meeting/ + Tue, 19 Nov 2013 08:00:00 +0000 + + https://ldbcouncil.org/event/third-tuc-meeting/ + <p>The LDBC consortium is pleased to announce the third Technical User Community (TUC) meeting!</p> +<p>This will be a one day event in London on the <strong>19 November 2013</strong> running in collaboration with the <a href="http://www.graphconnect.com/london/">GraphConnect</a> event (18/19 November). Registered TUC participants that would like a free pass to all of GraphConnect should register for GraphConnect using this following coupon code: <strong>LDBCTUC</strong>.</p> +<p>The TUC event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology</li> +<li>Industry discussions on the contents of the benchmarks</li> +</ul> +<p>We will also be launching the LDBC non-profit organization, so anyone outside the EU project will be able to join as a member.</p> +<p>We will kick off new benchmark development task forces in the coming year, and talks at this coming TUC will play an important role in deciding the use case scenarios that will drive those benchmarks.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a></li> +<li><a href="#ldbctuc-background">LDBC/TUC Background</a> +<ul> +<li><a href="#social-network-benchmark">Social Network Benchmark</a></li> +<li><a href="#semantic-publishing-benchmark">Semantic Publishing Benchmark</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>November 19th - Public TUC Meeting</strong></p> +<p>8:00 Breakfast and registration will open for Graph Connect/TUC at 8:00 am (Dexter House)</p> +<p>short LDBC presentation (Peter Boncz) during GraphConnect keynote by Emil Eifrem (09:00-09:30 Dexter House)</p> +<p>NOTE: the TUC meeting is at the Tower Hotel, nearby Dexter House.</p> +<p>10:00 TUC Meeting Opening (Peter Boncz)</p> +<p>10:10 TUC Presentations (RDF Application Descriptions)</p> +<ul> +<li>Johan Hjerling (BBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275669.pdf">BBC Linked Data and the Semantic Publishing Benchmark</a></strong></em></li> +<li>Andreas Both (Unister): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505027.pdf">Ontology-driven applications in an e-commerce context</a></strong></em></li> +<li>Nuno Carvalho (Fujitsu Laboratories Europe): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275666.pdf"><em><strong>Fujitsu RDF use cases and benchmarking requirements</strong></em></a></li> +<li>Robina Clayphan (Europeana): <em><strong><a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816977.ppt">Europeana and Open Data</a></strong></em></li> +</ul> +<p>11:30 Semantic Publishing Benchmark (SPB)</p> +<ul> +<li>Venelin Kotsev (Ontotext - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">Semantic Publishing Benchmark Task Force Update</a></strong></em> and <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">report</a></strong></em></li> +</ul> +<p>12:00-13:00 Lunch at the Graph Connect venue</p> +<p><em>Talks During Lunch:</em></p> +<ul> +<li>Pedro Furtado, Jorge Bernardino (Univ. Coimbra): <strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275671.pdf">KEYSTONE Cost Action</a></strong></li> +</ul> +<p>13:00 TUC Presentations (Graph Application Descriptions)</p> +<ul> +<li>Minqi Zhou / Weining Qian (East China Normal University): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275670.pdf">Elastic and realistic social media data generation</a></strong></em></li> +<li>Andrew Sherlock (Shapespace): <em><strong>Shapespace Use Case</strong></em></li> +<li>Sebastian Verheughe (Telenor): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275667.pdf">Real-time Resource Authorization</a></strong></em></li> +</ul> +<p>14:00 Social Network Benchmark (SNB)</p> +<ul> +<li>Norbert Martinez (UPC - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505025.pdf">Social Network Benchmark Task Force Update</a></strong></em> and <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816975.pdf">Report</a></li> +</ul> +<p><em>14:30 Break</em></p> +<p>14:45 TUC Presentations (Graph Analytics)</p> +<ul> +<li>Keith Houck (IBM): <em><strong>Benchmarking experiences with [System G Native Store (tentative title)]</strong></em></li> +<li>Abraham Bernstein (University of Zurich): <em><strong>Streams and Advanced Processing: Benchmarking RDF querying beyond the Standard SPARQL Triple Store</strong></em></li> +<li>Luis Ceze (University of Washington): <em><strong>Grappa and GraphBench Status Update</strong></em></li> +</ul> +<p><em>15:45 Break</em></p> +<p>16:00 TUC Presentations* (Possible Future RDF Benchmarking Topics)*</p> +<ul> +<li>Christian-Emil Ore (Unit for Digital Documentation, University of Oslo, Norway): <em><strong>CIDOC-CRM</strong></em></li> +<li>Atanas Kiryakov (Ontotext): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275672.pdf">Large-scale Reasoning with a Complex Cultural Heritage Ontology (CIDOC CRM)</a></strong></em></li> +<li>Kostis Kyzirakos (National and Kapodistrian University of Athens / CWI): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275668.pdf">Geographica: A Benchmark for Geospatial RDF Stores</a></strong></em></li> +<li>Xavier Lopez (Oracle): <em><strong>W3C Property Graph progress</strong></em></li> +<li>Thomas Scharrenbach (University Zurich) <em><strong>PCKS: Benchmarking Semantic Flow Processing Systems</strong></em></li> +</ul> +<p>17:20 
Meeting Conclusion (Josep Larriba Pey)</p> +<p>17:30 End of TUC meeting</p> +<p>19:00 Social dinner</p> +<p><strong>November 20th - Internal LDBC Meeting</strong></p> +<p>10:00 Start</p> +<p>12:30 <em>End of meeting</em></p> +<ul> +<li>coffee and lunch provided</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p><strong>Date</strong></p> +<p>19th November 2013</p> +<p><strong>Location</strong></p> +<p>The TUC meeting will be held in <strong>The Tower</strong> hotel (<a href="http://goo.gl/qZt8Fz">Google Maps link</a>) approximately 4 minutes walk from the <a href="http://www.graphconnect.com/london/">GraphConnect</a> conference in London.</p> +<p>Getting there</p> +<ul> +<li>From City Airport is the easiest: short ride on the DLR to Tower Gateway. Easy.</li> +<li>From London Heathrow: first need to take the Heathrow Express to Paddington. Then take the Circle line to Tower Hill. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554995.pdf">See attached</a>.</li> +</ul> +<h3 id="ldbctuc-background">LDBC/TUC Background</h3> +<p>Looking back, we have been working on two benchmarks for the past year: a Social Network Benchmark (SNB) and a Semantic Publishing Benchmark (SPB). While below we provide a short summary, all the details of the work on these benchmark development efforts can be found in the first yearly progress reports:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SNB_Report_Nov2013.pdf</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SPB_Report_Nov2013.pdf</a></li> +</ul> +<p>A summary of these efforts can be read below or, for a more detailed account, please refer to: <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554967.pdf">The Linked Data Benchmark Council: a Graph and RDF industry benchmarking effort</a>. Annual reports about the progress, results, and future work of these two efforts will soon be available for download here, and will be discussed in depth at the TUC.</p> +<h4 id="social-network-benchmark">Social Network Benchmark</h4> +<p>The Social Network Benchmark (SNB) is designed for evaluating a broad range of technologies for tackling graph data management workloads. The systems targeted are quite broad: from graph, RDF, and relational database systems to Pregel-like graph compute frameworks. The social network scenario was chosen with the following goals in mind:</p> +<ul> +<li>it should be understandable, and the relevance of managing such data should be understandable</li> +<li>it should cover the complete range of interesting challenges, according to the benchmark scope</li> +<li>the queries should be realistic, i.e., similar data and workloads are encountered in practice</li> +</ul> +<p>SNB includes a data generator for creation of synthetic social network data with the following characteristics:</p> +<ul> +<li>data schema is representative of real social networks</li> +<li>data generated includes properties occurring in real data, e.g. 
irregular structure, structure/value correlations, power-law distributions</li>
+<li>the software generator is easy-to-use, configurable and scalable</li>
+</ul>
+<p>SNB is intended to cover a broad range of aspects of social network data management, and therefore includes three distinct workloads:</p>
+<ul>
+<li><strong>Interactive</strong>
+<ul>
+<li>Tests system throughput with relatively simple queries and concurrent updates; it is designed to test ACID features and scalability in an online operational setting.</li>
+<li>The targeted systems are expected to be those that offer transactional functionality.</li>
+</ul>
+</li>
+<li><strong>Business Intelligence</strong>
+<ul>
+<li>Consists of complex structured queries for analyzing the online behavior of users for marketing purposes; it is designed to stress query execution and optimization.</li>
+<li>The targeted systems are expected to be those that offer an abstract query language.</li>
+</ul>
+</li>
+<li><strong>Graph Analytics</strong>
+<ul>
+<li>Tests the functionality and scalability of systems for graph analytics, which typically cannot be expressed in a query language.</li>
+<li>Analytics is performed on most/all of the data in the graph as a single operation and produces large intermediate results, and it is not expected to be transactional or need isolation.</li>
+<li>The targeted systems are graph compute frameworks, though database systems may compete, for example by using iterative implementations that repeatedly execute queries and keep intermediate results in temporary data structures.</li>
+</ul>
+</li>
+</ul>
+<h4 id="semantic-publishing-benchmark">Semantic Publishing Benchmark</h4>
+<p>The Semantic Publishing Benchmark (SPB) simulates the management and consumption of RDF metadata that describes media assets, or creative works.</p>
+<p>The scenario is a media organization that maintains RDF descriptions of its catalogue of creative works &ndash; input was provided by actual media organizations which make heavy use of RDF, including the BBC. The benchmark is designed to reflect a scenario where a large number of aggregation agents provide the heavy query workload, while at the same time a steady stream of creative work description management operations is in progress. This benchmark only targets RDF databases, which support at least basic forms of semantic inference. A tagging ontology is used to connect individual creative work descriptions to instances from reference datasets, e.g. sports, geographical, or political information. The data used falls under the following categories: reference data, which is a combination of several Linked Open Data datasets, e.g. GeoNames and DBpedia; domain ontologies, which are specialist ontologies used to describe certain areas of expertise of the publisher, e.g., sport and education; publication asset ontologies, which describe the structure and form of the assets that are published, e.g., news stories, photos, video, audio, etc.; and tagging ontologies and the metadata, which link assets with reference/domain ontologies.</p>
+<p>The data generator is initialized by using several ontologies and datasets. The instance data collected from these datasets are then used at several points during the execution of the benchmark.
Data generation is performed by generating SPARQL fragments for create operations on creative works and executing them against the RDF database system.</p> +<p>Two separate workloads are modeled in SPB:</p> +<ul> +<li><strong>Editorial:</strong> Simulates creating, updating and deleting creative work metadata descriptions. Media companies use both manual and semi-automated processes for efficiently and correctly managing asset descriptions, as well as annotating them with relevant instances from reference ontologies.</li> +<li><strong>Aggregation:</strong> Simulates the dynamic aggregation of content for consumption by the distribution pipelines (e.g. a web-site). The publishing activity is described as &ldquo;dynamic&rdquo;, because the content is not manually selected and arranged on, say, a web page. Instead, templates for pages are defined and the content is selected when a consumer accesses the page.</li> +</ul> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505026.pdf">Status of the Semantic Publishing Benchmark</a></p> + + + + + Second TUC Meeting + https://ldbcouncil.org/event/second-tuc-meeting/ + Mon, 22 Apr 2013 10:00:00 +0000 + + https://ldbcouncil.org/event/second-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the second Technical User Community (TUC) meeting.</p> +<p>This will be a two day event in Munich on the <strong>22/23rd April 2013</strong>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend. 
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +<li><a href="#venue">Venue</a> +<ul> +<li><a href="#getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</a></li> +<li><a href="#getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</a></li> +<li><a href="#getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</a></li> +</ul> +</li> +<li><a href="#getting-there">Getting there</a></li> +<li><a href="#social-dinner">Social Dinner</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>April 22nd</strong></p> +<p>10:00 <em>Registration.</em><br> +10:30 Josep Lluis Larriba Pey (UPC) - <em>Welcome and Introduction.</em><br> +10:30 Peter Boncz (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687373.pptx">LDBC: goals and status</a></p> +<p><em>Social Network Use Cases (with discussion moderated by Josep Lluis Larriba Pey)</em></p> +<p>11:00 Josep Lluis Larriba Pey (UPC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687372.pdf">Social Network Benchmark Task Force</a><br> +11:30 Gustavo González (Mediapro): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687367.pdf">Graph-based User Modeling through Real-time Social Streams</a><br> +12:00 Klaus Großmann (Dshini): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687365.pdf">Neo4j at Dshini</a></p> +<p>12:30 Lunch</p> +<p><em>Semantic Publishing Use Cases (with discussion moderated by Barry Bishop)</em></p> +<p>13:30 Barry Bishop (Ontotext): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687366.pptx">Semantic Publishing Benchmark Task Force</a><br> +14:00 Dave Rogers (BBC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687364.pptx">Linked Data Platform at the BBC</a><br> +14:30 Edward Thomas (Wolters Kluwer): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687374.pdf">Semantic Publishing at Wolters Kluwer</a></p> +<p>15:00 Coffee break</p> +<p><em>Projects Related to LDBC</em></p> +<p>15:30 Fabian Suchanek (MPI): &ldquo;YAGO: A large knowledge base from Wikipedia and WordNet&rdquo;<br> +16:00 Antonis Loziou (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687375.pptx">The OpenPHACTS approach to data integration</a><br> +16:30 Mirko Kämpf (Brox): &ldquo;GeoKnow - Spatial Data Web project and Supply Chain Use Case&rdquo;</p> +<p>17:00 <em>End of first day</em></p> +<p>19:00 Social dinner</p> +<p><strong>April 23rd</strong></p> +<p><em>Industry &amp; Hardware Aspects</em></p> +<p>10:00 Xavier Lopez (Oracle): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687384.pdf">Graph Database Performance an Oracle Perspective.pdf</a><br> +10:30 Pedro Trancoso (University of Cyprus): &ldquo;Benchmarking and computer architecture: the research 
side&rdquo;</p> +<p>11:00 Coffee break</p> +<p><em>Future Steps and TUC feedback session</em></p> +<p>11:30 Peter Boncz (VUA) moderates: next steps in the Social Networking Task Force<br> +12:00 Barry Bishop (Ontotext) moderates: next steps in the Semantic Publishing Task Force&quot;</p> +<p>12:30 <em>End of meeting</em></p> +<h3 id="logistics">Logistics</h3> +<h4 id="date">Date</h4> +<p>22nd and 23th April 2013</p> +<h4 id="location">Location</h4> +<p>The TUC meeting will be held at LE009 room at LRZ (Leibniz-Rechenzentrum) located inside the TU Munich campus in Garching, Germany. The address is:</p> +<p>LRZ (Leibniz-Rechenzentrum)<br> +Boltzmannstraße 1<br> +85748 Garching, Germany</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including Taxi and Subway <a href="http://www.in.tum.de/fileadmin/user_upload/Sonstiges/anfahrt_garching.pdf">Ubahn</a></p> +<h5 id="getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</h5> +<p>Take the U-bahn line U6 in the direction of Garching-Forschungszentrum, exit at the end station. Take the south exit to MI-Building and LRZ on the Garching Campus. The time of the journey from the city center is approx. 25-30 minutes. In order to get here from the City Center, you need the Munich XXL ticket that costs around 7.50 euros and covers all types of transportation for one day. The ticket has to be validated before ride.</p> +<h5 id="getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</h5> +<ol> +<li> +<p>(except weekends) S-Bahn S8 line in the direction of (Hauptbahnhof) Munich Central Station until the third stop, Ismaning (approx. 13 minutes). From here Bus Nr. 230 until stop MI-Building on the Garching Campus. Alternatively: S1 line until Neufahrn, then with the Bus 690, which stops at Boltzmannstraße.</p> +</li> +<li> +<p>S-Bahn lines S8 or S1 towards City Center until Marienplatz stop. Then change to U-bahn U6 line towards Garching-Forschungszentrum, exit at the last station. Take the south exit to MI-Building and LRZ.</p> +</li> +<li> +<p>Taxi: fare is ca. 30-40 euros.</p> +</li> +</ol> +<p>For cases 1 and 2, before the trip get the One-day Munich Airport ticket and validate it. It will cover all public transportation for that day.</p> +<h5 id="getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</h5> +<p>The city of Garching is located on the U6 line, one stop before the Garching-Forschungszentrum. In order to get from Garching to Garching-Forschungszentrum with the U-bahn, a special one-way ticket called Kurzstrecke (1.30 euros) can be purchased.</p> +<p><strong>Finding LRZ@TUM</strong></p> +<p><a href="http://www.openstreetmap.org/?mlat=48.2615702464&amp;mlon=11.6686558264&amp;zoom=32">OpenStreetMap link</a></p> +<p><a href="https://maps.google.com/maps?q=48.2615702464,11.6686558264&amp;spn=0.005,0.005&amp;t=k">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687268.gif" alt=""></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687269.gif" alt=""></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying: Munich</strong> airport is located 28.5 km northeast of Munich. 
There are two ways to get from the airport to the city center: suburban train (S-bahn) and Taxi.</p> +<p><strong>S-Bahn:</strong> S-bahn lines S1 and S8 will get you from the Munich airport to the city center, stopping at both Munich Central Station (Hauptbahnhof) and Marienplatz. One-day Airport-City ticket costs 11.20 euros and is valid for the entire Munich area public transportation during the day of purchase (the tickets needs to be validated before the journey). S-bahn leaves every 5-20 minutes and reaches the city center in approx. 40 minutes.</p> +<p><strong>Taxi:</strong> taxi from the airport to the city center costs approximately 50 euros</p> +<h4 id="social-dinner">Social Dinner</h4> +<p>The social dinner will take place at 7 pm on April 22 in Hofbräuhaus (second floor)</p> +<p>Address: Hofbräuhaus, Platzl 9, Munich</p> + + + + + First TUC Meeting + https://ldbcouncil.org/event/first-tuc-meeting/ + Mon, 19 Nov 2012 09:00:00 +0100 + + https://ldbcouncil.org/event/first-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the first Technical User Community (TUC) meeting. This will be a two day event in Barcelona on the <strong>19/20th November 2012</strong>.</p> +<p>So far more than six commercial consumers of graph/RDF database technology have expressed an interest in attending the event and more are welcome. The proposed format of the event wil include:</p> +<ul> +<li>Introduction by the coordinator and technical director explaining the objectives of the LDBC project</li> +<li>Invitation to users to explain their use-cases and describe the limitations they have found in current technology</li> +<li>Brain-storming session for identifying trends and mapping out strategies to tackle existing choke-points</li> +</ul> +<p>The exact agenda will be published here as things get finalised before the event.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#slide">Slide</a> +<ul> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +</ul> +</li> +<li><a href="#venue">Venue</a></li> +<li><a href="#getting-there">Getting there</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p>We will start at 9:00 on Monday for a full day, followed by a half a day on Tuesday to allow attendees to travel home on the evening of the 20th.</p> +<p><strong>Day 1</strong></p> +<p>09:00 Welcome (Location: Aula Master)<br> +09:30 Project overview (Emphasis on task forces?) 
+ Questionnaire results?<br> +10:30 Coffee break<br> +11:00 User talks (To gather information for use cases?)</p> +<p>13:00 Lunch</p> +<p>14:00 User talks (cont.)<br> +15:00 Use case discussions (based on questionnaire results + consortium proposal + user talks).<br> +16:00 Task force proposals (consortium)<br> +17:00 Finish first day</p> +<p>20:00 Social dinner</p> +<p><strong>Day 2</strong></p> +<p>10:00 Task force discussion (consortium + TUC)<br> +11:00 Coffe break<br> +11:30 Task force discussion (consortium + TUC)<br> +12:30 Summaries (Task forces, use cases, &hellip;) and actions</p> +<p>13:00 Lunch and farewell</p> +<p>15:00 LDBC Internal meeting</p> +<h3 id="slide">Slide</h3> +<p>Opening session:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686995.pptx">CWI – Peter Boncz</a> – Objectives</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687001.pdf">UPC – Larri</a> – Questionnaire</li> +</ul> +<p>User stories:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686998.pdf">BBC – Jem Rayfield</a></li> +<li>CA Technologies – Victor Muntés</li> +<li>Connected Discovery (Open Phacts) – Bryn Williams-Jones</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687003.pptx">Elsevier – Alan Yagoda</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687000.pptx">ERA7 Bioinformatics – Eduardo Pareja</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687005.pptx">Press Association – Jarred McGinnis</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687004.pptx">RJLee – David Neuer</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686994.pdf">Yale – Lec Maj</a></li> +</ul> +<p>Benchmark proposals:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686991.pdf">Publishing benchmark proposal – Ontotext – Barry Bishop</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687002.pdf">Social Network Benchmark Proposal – UPC – Larri</a></li> +</ul> +<h4 id="logistics">Logistics</h4> +<h5 id="date">Date</h5> +<p>19th and 20th November 2012</p> +<h5 id="location">Location</h5> +<p>The TUC meeting will be held at “Aula Master” at A3 building located inside the “Campus Nord de la UPC” in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<p><strong>Finding UPC</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<p><strong>Finding the meeting room</strong></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €16 and trips to other destinations in the city cost approximately €18.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. 
You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<p><strong>The locations of the airport and the city centre</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933317.jpg" alt=""></p> +<p><strong>Bus map</strong></p> + + + + + \ No newline at end of file diff --git a/industry/members/index.html b/industry/members/index.html new file mode 100644 index 00000000..6e861009 --- /dev/null +++ b/industry/members/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/organizational-members/ + + + + + + diff --git a/introduction/index.html b/introduction/index.html new file mode 100644 index 00000000..f1fb1c65 --- /dev/null +++ b/introduction/index.html @@ -0,0 +1,359 @@ + + + + + Introduction + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Introduction

+ + + + +
+
+
+
+ + + + + +
+
+
+
+
+

The Linked Data Benchmark Council (LDBC) is a non-profit organization aiming to define standard graph benchmarks to foster a community around graph processing technologies. LDBC consists of members from both industry and academia, including organizations and individuals.

+

An overview of our activities is summarized in a lightning talk at FOSDEM 2023’s HPC room (9 minutes):

+ +

See also our TPCTC 2023 paper and its slide deck.

+

Contact

+

To learn more about LDBC, reach out at info@ldbcouncil.org.

+

Postal address

+

First Floor, Two Chamberlain Square
+Birmingham
+B3 3AX
+United Kingdom

+ +
+
+ +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/jan-2-2006/index.html b/jan-2-2006/index.html new file mode 100644 index 00000000..79ae69b3 --- /dev/null +++ b/jan-2-2006/index.html @@ -0,0 +1,777 @@ + + + + + Jan 2, 2006 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Jan 2, 2006

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Posts

+
Tags:
+ +
+
+ + + +
+
+ +
+ + +
+
+
+ +

Record-Breaking SNB Interactive Results for GraphScope

+
Tags:
+ BENCHMARK + , SNB + +
+
+ +

We are happy to announce new audited results for the SNB Interactive workload, achieved by the open-source GraphScope Flex system.

+

The current audit of the system has broken several records:

+
    +
  • It achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s.
  • +
  • It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s.
  • +
  • It is the first system to successfully complete the benchmark on …
+ +
+
+ +
+ + +
+
+ +
+ +

Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers and to assist in the generation of code examples and tests for the GQL language. See this announcement from Alastair Green, Vice-chair of LDBC.

+

These tools are the work of the LDBC GQL Implementation Working Group, headed up by Michael Burbidge. Damian Wileński and Dominik Tomaszuk have worked …

+ +
+
+ +
+ + +
+
+ +
+ +

We are delighted to announce the official release of the initial version (v0.1.0) of the Financial Benchmark (FinBench).

+

The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the LDBC FinBench Task Force. The benchmark currently has one workload, the Transaction Workload, capturing an OLTP scenario with complex read queries that access the …

+ +
+
+ +
+ + +
+
+
+ +

LDBC SNB – Early 2023 updates

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

2023 has been an eventful year for us so far. Here is a summary of our recent activities.

+
    +
  1. +

    Our paper The LDBC Social Network Benchmark: Business Intelligence Workload was published in PVLDB.

    +
  2. +
  3. +

    David Püroja just completed his MSc thesis on creating a design towards SNB Interactive v2 at CWI’s Database Architectures group. David and I gave a deep-dive talk at the FOSDEM conference’s graph developer room titled The LDBC Social Network …

+ +
+
+ +
+ + +
+
+
+ +

LDBC SNB Datagen – The winding path to SF100K

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

LDBC SNB provides a data generator, which produces synthetic datasets, mimicking a social network’s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism and usability. More than two years have elapsed since my last technical update on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/jan-2-2006/index.xml b/jan-2-2006/index.xml new file mode 100644 index 00000000..5125d871 --- /dev/null +++ b/jan-2-2006/index.xml @@ -0,0 +1,5467 @@ + + + + Jan 2, 2006 on Linked Data Benchmark Council + https://ldbcouncil.org/jan-2-2006/ + Recent content in Jan 2, 2006 on Linked Data Benchmark Council + Hugo -- gohugo.io + en-us + &copy; Copyright LDBC 2024 + + Eighteenth TUC Meeting + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + Fri, 30 Aug 2024 09:00:00 -0800 + + https://ldbcouncil.org/event/eighteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Shipeng Qi (AntGroup), Wenyuan Yu (Alibaba Demo), Yan Zhou (CreateLink)</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located in <strong>Guangzhou</strong> with <a href="https://vldb.org/2024/">VLDB 2024</a> on <strong>August 30-31 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. <strong>If you would like to participate please register using <a href="https://forms.gle/aVPrrcxXpSwrWPnh6">our form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="august-30-friday">August 30, Friday</h4> +<p><strong>Location:</strong> <a href="https://www.langhamhotels.com/en/the-langham/guangzhou/">Langham Place</a>, Guangzhou, <strong>room 1</strong>,<br> +co-located with VLDB (N0.630-638 Xingang Dong Road, Haizhu District, Guangzhou, China). See the map <a href="https://maps.app.goo.gl/86jD3Dy9Aa7bwLs36">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="august-31-saturday">August 31, Saturday</h4> +<p><strong>Location:</strong> Alibaba Center, Guangzhou (N0.88 Dingxin Road, Haizhu District, Guangzhou, China), near to VLDB Langham Place. See the map <a href="https://maps.app.goo.gl/HgEVafZMRmrzUsgW8">here</a>.</p> +<p><strong>Agenda:</strong> TBA</p> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + Seventeenth TUC Meeting + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + Sun, 09 Jun 2024 09:00:00 -0400 + + https://ldbcouncil.org/event/seventeenth-tuc-meeting/ + <p><strong>Organizers:</strong> Renzo Angles, Sebastián Ferrada</p> +<p>LDBC is hosting a one-day in-person workshop, co-located in <strong>Santiago de Chile</strong> with <a href="https://2024.sigmod.org/venue.shtml">SIGMOD 2024</a> on <strong>June 9 (Sunday)</strong>.</p> +<p>The workshop will be held in the <strong>Hotel Plaza El Bosque Ebro</strong> (<a href="https://www.plazaelbosque.cl">https://www.plazaelbosque.cl</a>), which is two blocks away from SIGMOD&rsquo;s venue. 
See the map <a href="https://maps.app.goo.gl/78oiw3zo2pH3gy5R6">here</a>.</p> +<p><strong>If you would like to participate please register using <a href="https://forms.gle/XXgaQfwBZAMMZJb78">this form</a>.</strong></p> +<h3 id="program">Program</h3> +<p><strong>All times are in Chile time (GMT-4).</strong></p> +<p><strong>Each speaker will have 20 minutes for exposition plus 5 minutes for questions.</strong></p> +<table> +<thead> +<tr> +<th>Time</th> +<th>Speaker</th> +<th>Title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>Welcome</td> +<td>&ldquo;Canelo&rdquo; saloon</td> +</tr> +<tr> +<td>09:30</td> +<td>Alastair Green (LDBC Vice-chair)</td> +<td>Status of the LDBC Extended GQL Schema Working Group</td> +</tr> +<tr> +<td>10:00</td> +<td>Hannes Voigt (Neo4j)</td> +<td>Inside the Standardization Machine Room: How ISO/IEC 39075:2024 – GQL was produced</td> +</tr> +<tr> +<td>10:30</td> +<td>Calin Iorgulescu (Oracle)</td> +<td>PGX.D: Distributed graph processing engine</td> +</tr> +<tr> +<td>11:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>11:30</td> +<td>Ricky Sun (Ultipa, Inc.)</td> +<td>A Unified Graph Framework with SCC (Storage-Compute Coupled) and HDC (High-Density Computing) Clustering</td> +</tr> +<tr> +<td>12:00</td> +<td>Daan de Graaf (TU Eindhoven)</td> +<td>Algorithm Support in a Graph Database, Done Right</td> +</tr> +<tr> +<td>12:30</td> +<td>Angela Bonifati (Lyon 1 University and IUF, France)</td> +<td>Transforming Property Graphs</td> +</tr> +<tr> +<td>13:00</td> +<td>Brunch</td> +<td></td> +</tr> +<tr> +<td>14:00</td> +<td>Juan Sequeda (data.world)</td> +<td>A Benchmark to Understand the Role of Knowledge Graphs on Large Language Model&rsquo;s Accuracy for Question Answering on Enterprise SQL Databases</td> +</tr> +<tr> +<td>14:30</td> +<td>Olaf Hartig (Linköping University)</td> +<td>FedShop: A Benchmark for Testing the Scalability of SPARQL Federation Engines</td> +</tr> +<tr> +<td>15:00</td> +<td>Olaf Hartig (Amazon)</td> +<td>Datatypes for Lists and Maps in RDF Literals</td> +</tr> +<tr> +<td>15:30</td> +<td>Peter Boncz (CWI and MotherDuck)</td> +<td>The state of DuckPGQ</td> +</tr> +<tr> +<td>16:00</td> +<td>Coffee break</td> +<td></td> +</tr> +<tr> +<td>16:30</td> +<td>Juan Reutter (IMFD and PUC Chile)</td> +<td>MillenniumDB: A Persistent, Open-Source, Graph Database</td> +</tr> +<tr> +<td>17:00</td> +<td>Carlos Rojas (IMFD)</td> +<td>WDBench: A Wikidata Graph Query Benchmark</td> +</tr> +<tr> +<td>17:30</td> +<td>Sebastián Ferrada (IMFD and Univ. 
de Chile)</td> +<td>An algebra for evaluating path queries</td> +</tr> +<tr> +<td>19:30</td> +<td>Dinner</td> +<td></td> +</tr> +</tbody> +</table> + + + + + Record-Breaking SNB Interactive Results for GraphScope + https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/ + Sun, 26 May 2024 00:00:00 +0000 + + https://ldbcouncil.org/post/record-breaking-snb-interactive-results-for-graphscope/ + <p>We are happy to annonunce new <a href="https://ldbcouncil.org/benchmarks/snb-interactive/">audited results for the SNB Interactive workload</a>, achieved by the open-source <a href="https://github.com/alibaba/GraphScope">GraphScope Flex</a> system.</p> +<p>The current audit of the system has broken several records:</p> +<ul> +<li>It achieved 130.1k ops/s on scale factor 100, compared to the previous record of 48.8k ops/s.</li> +<li>It achieved 131.3k ops/s on scale factor 300, compared to the previous record of 48.3k ops/s.</li> +<li>It is the first system to successfully complete the benchmark on scale factor 1000. It achieved a throughput of 127.8k ops/s</li> +</ul> +<p>The audit was commissioned by the <a href="https://www.alibabacloud.com/">Alibaba Cloud</a> and was conducted by <a href="https://www.linkedin.com/in/arnau-prat-a70283bb/">Dr. Arnau Prat-Pérez</a>, one of the original authors of the SNB Interactive benchmark. The queries were implemented as C++ stored procedures and the benchmark was executed on the Alibaba Cloud&rsquo;s infrastructure. The <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-executive_summary.pdf">executive summary</a>, <a href="https://ldbcouncil.org/benchmarks/snb/LDBC_SNB_I_20240514_SF100-300-1000_graphscope.pdf">full disclosure report</a>, and <a href="%5B/benchmarks/snb/%5D(https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/audits/LDBC_SNB_I_20240514_SF100-300-1000_graphscope-attachments.tar.gz)">supplementary package</a> describe the benchmark&rsquo;s steps and include instructions for reproduction.</p> +<p>LDBC would like to congratulate the GraphScope Flex team on their record-breaking results.</p> +<div align="center"><img src="https://ldbcouncil.org/images/graphscope.svg" width="200"></div> + + + + + Launching open-source language tools for ISO/IEC GQL + https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/ + Thu, 09 May 2024 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-announces-open-source-gql-tools/ + <p>Following the publication of ISO/IEC GQL (graph query language) in April 2024, LDBC today launches open-source language engineering tools to help implementers, and assist in generation of code examples and tests for the GQL language. See this <a href="https://ldbcouncil.org/pages/opengql-announce">announcement from Alastair Green, Vice-chair of LDBC</a>.</p> +<p>These tools are the work of the <strong>LDBC GQL Implementation Working Group</strong>, headed up by Michael Burbidge. 
Damian Wileński and Dominik Tomaszuk have worked with Michael to create these artefacts based on his ANTLR grammar for GQL.</p> + + + + + Announcing the Official Release of LDBC Financial Benchmark v0.1.0 + https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/ + Tue, 27 Jun 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-official-release-of-ldbc-financial-benchmark/ + <p>We are delighted to announce the official release of the initial version (v0.1.0) of <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench)</a>.</p> +<p>The Financial Benchmark (FinBench) project defines a graph database benchmark targeting financial scenarios such as anti-fraud and risk control. It is maintained by the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">LDBC FinBench Task Force</a>. The benchmark has one workload currently, <strong>Transaction Workload</strong>, capturing OLTP scenario with complex read queries that access the neighbourhood of a given node in the graph and write queries that continuously insert or delete data in the graph.</p> +<p>Compared to LDBC SNB, the FinBench differs in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. For a brief overview, see the <a href="https://ldbcouncil.org/benchmarks/finbench/finbench-talk-16th-tuc.pdf">slides</a> in the 16th TUC. The <a href="https://arxiv.org/pdf/2306.15975.pdf">Financial Benchmark&rsquo;s specification</a> can be found on arXiv.</p> +<p>The release of FinBench initial version (v0.1.0) was approved by LDBC on June 23, 2023. It is the good beginning of FinBench. In the future, the FinBench Task Force will polish the benchmark continuously.</p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or qishipeng.qsp at antgroup.com.</p> + + + + + Sixteenth TUC Meeting + https://ldbcouncil.org/event/sixteenth-tuc-meeting/ + Fri, 23 Jun 2023 09:00:00 -0800 + + https://ldbcouncil.org/event/sixteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Oskar van Rest, Alastair Green, Gábor Szárnyas</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2023.sigmod.org/venue.shtml">SIGMOD 2023</a> on <strong>June 23-24 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10- and 15-minute talks followed by a Q&amp;A session. The talks will be recorded and made available online. 
<strong>If you would like to participate please register using <a href="https://forms.gle/T6bwVHzK9V5FaKyR9">our form</a>.</strong></p> +<p>LDBC will host a <strong>social event</strong> on Friday at the <a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a>.</p> +<p>In addition, AWS will host a <strong>Happy Hour</strong> (rooftop grill with beverages) on Saturday on the Amazon Nitro South building&rsquo;s 8th floor deck: <a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>.</p> +<h3 id="program">Program</h3> +<p><strong>All times are in PDT.</strong></p> +<h4 id="friday">Friday</h4> +<p><strong>Location:</strong> Hyatt Regency Bellevue on Seattle&rsquo;s Eastside, <strong>room Grand K</strong>, co-located with SIGMOD (<a href="https://www.hyatt.com/en-US/hotel/washington/hyatt-regency-bellevue-on-seattles-eastside/belle">900 Bellevue Way NE, Bellevue, WA 98004-4272</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>08:30</td> +<td>08:45</td> +<td>Oskar van Rest (Oracle)</td> +<td>LDBC – State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-ldbc-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/Frk7ITssaSY">video</a></td> +</tr> +<tr> +<td>08:50</td> +<td>09:05</td> +<td>Keith Hare (JCC / WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/keith-hare-an-update-on-the-gql-and-sql-pgq-standards-efforts.pdf">slides</a>, <a href="https://youtu.be/LQYkal_0j6E">video</a></td> +</tr> +<tr> +<td>09:10</td> +<td>09:25</td> +<td>Stefan Plantikow (Neo4j / WG3)</td> +<td>GQL - Introduction to a new query language standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/stefan-plantikow-gql-v1.pdf">slides</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Leonid Libkin (University of Edinburgh &amp; RelationalAI)</td> +<td>Formalizing GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/leonid-libkin-formalizing-gql.pdf">slides</a>, <a href="https://youtu.be/YZE1a00h1I4">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Semen Panenkov (JetBrains Research)</td> +<td>Mechanizing the GQL semantics in Coq – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/semyon-panenkov-gql-in-coq.pdf">slides</a>, <a href="https://youtu.be/5xBGohqWCzo">videos</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Oskar van Rest (Oracle)</td> +<td>SQL Property Graphs in Oracle Database and Oracle Graph Server (PGX) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/oskar-van-rest-sql-property-graphs-in-oracle-database-and-oracle-graph-server-pgx.pdf">slides</a>, <a href="https://youtu.be/owM9WiQubpg">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (JCC)</td> +<td>LDBC&rsquo;s organizational changes and fair use policies – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-ldbc-corporate-restructuring-and-fair-use-policies.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>Ioana Manolescu (INRIA)</td> +<td>Integrating Connection Search in Graph Queries – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ioana-manolescu-integrating-connection-search-in-graph-queries.pdf">slides</a>, <a href="https://youtu.be/LQPnmcrkUpY">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Maciej Besta (ETH Zurich)</td> +<td>Neural Graph Databases with Graph Neural Networks – <a href="https://youtu.be/ce5qNievRNs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:10</td> +<td>Longbin Lai (Alibaba Damo Academy)</td> +<td>To Revisit Benchmarking Graph Analytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/longbin-lai-benchmark-ldbc.pdf">slides</a>, <a href="https://youtu.be/s9Vtt-6t_FI">video</a></td> +</tr> +<tr> +<td>12:15</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>The World of Graph Databases from An Industry Perspective – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/yuanyuan-tian-world-of-graph-databases.pdf">slides</a>, <a href="https://youtu.be/AZuP_b95GPM">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Alin Deutsch (UC San Diego &amp; TigerGraph)</td> +<td>TigerGraph&rsquo;s Parallel Computation Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alin-deutsch-tigergraphs-computation-model.pdf">slides</a>, <a href="https://youtu.be/vcxdieJB80Y">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Chen Zhang (CreateLink)</td> +<td>Applications of a Native Distributed Graph Database in the Financial Industry – <a href="https://youtu.be/GCCT79Sps9I">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Ricky Sun (Ultipa)</td> +<td>Design of highly scalable graph database systems – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ricky-sun-ultipa.pdf">slides</a>, <a href="https://youtu.be/Sg1F64O4vGM">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Heng Lin (Ant Group)</td> +<td>The LDBC SNB implementation in TuGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-the-ldbc-snb-implementation-in-tugraph.pdf">slides</a>, <a href="https://youtu.be/fy8AuVerwnY">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>Shipeng Qi (Ant Group)</td> +<td>FinBench: The new LDBC benchmark targeting financial scenario – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/shipeng-qi-finbench.pdf">slides</a>, <a href="https://youtu.be/0xLZadDOfZk">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>17:00</td> +<td>host: Heng Lin (Ant Group), panelists: Longbin Lai (Alibaba Damo Academy), Ricky Sun (Ultipa), Gabor Szarnyas (CWI), Yuanyuan Tian (Gray Systems Lab, Microsoft)</td> +<td>FinBench panel – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/heng-lin-finbench-panel.pdf">slides</a></td> +</tr> +<tr> +<td>19:00</td> +<td>22:00</td> +<td><em>dinner</em></td> +<td><em><a href="https://www.blackbottleseattle.com/">Black Bottle gastrotavern</a> in Belltown: <a href="https://goo.gl/maps/hQzBRR2nerZEQExw7">2600 1st Ave (on the corner of Vine), Seattle, WA 98121</a></em></td> +</tr> +</tbody> +</table> +<h4 id="saturday">Saturday</h4> +<p><strong>Location:</strong> Amazon Nitro South building, <strong>room 03.204</strong> (<a href="https://goo.gl/maps/md5kWUHaNUGhR9JB7">2205 8th Ave, Seattle, WA 98121</a>)</p> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:00</td> +<td>09:45</td> +<td>Brad Bebee (AWS)</td> +<td>Customers don&rsquo;t want a graph database, so why are we still here? – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/brad-bebee-tuc-keynote.pdf">slides</a>, <a href="https://youtu.be/bJlkpDC--fM">video</a></td> +</tr> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Fast and Efficient Update Handling for Graph H2TAP – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/muhammad-attahir-jibril-fast-and-efficient-update-handling-for-graph-h2tap.pdf">slides</a>, <a href="https://youtu.be/e8ZAszBsXV0">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Gabor Szarnyas (CWI)</td> +<td>LDBC Social Network Benchmark and Graphalytics – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-social-network-benchmark-and-graphalytics.pdf">slides</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:30</td> +<td>Atanas Kiryakov and Tomas Kovachev (Ontotext)</td> +<td>GraphDB – Benchmarking against LDBC SNB &amp; SPB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tomas-kovatchev-atanas-kiryakov-benchmarking-graphdb-with-snb-and-spb.pdf">slides</a>, <a href="https://youtu.be/U6OPpNFOWqg">video</a></td> +</tr> +<tr> +<td>11:35</td> +<td>11:50</td> +<td>Roi Lipman (Redis Labs)</td> +<td>Delta sparse matrices within RedisGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/roi-lipman-delta-matrix.pdf">slides</a>, <a href="https://youtu.be/qfKsplV4Ihk">video</a></td> +</tr> +<tr> +<td>11:55</td> +<td>12:05</td> +<td>Rathijit Sen (Microsoft)</td> +<td>Microarchitectural Analysis of Graph BI Queries on RDBMS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/rathijit-sen-microarchitectural-analysis.pdf">slides</a>, <a href="https://youtu.be/55B8CkH09js">video</a></td> +</tr> +<tr> +<td>12:10</td> +<td>13:30</td> +<td><em>lunch</em></td> +<td><em>on your own</em></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Alastair Green (JCC)</td> +<td>LEX &ndash; LDBC Extended GQL Schema – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/alastair-green-lex.pdf">slides</a>, <a href="https://youtu.be/DVpeb4Ce9Uw">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Ora Lassila (AWS)</td> +<td>Why limit yourself to {RDF, LPG} when you can do {RDF, LPG}, 
too – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/ora-lassila-why-limit-yourself-to-lpg-when-you-can-do-rdf-too.pdf">slides</a>, <a href="https://youtu.be/7uAInoUwdds">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Jan Hidders (Birkbeck, University of London)</td> +<td>PG-Schema: a proposal for a schema language for property graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/jan-hidders-pg-schema.pdf">slides</a>, <a href="https://youtu.be/yQNL8hBTE4M">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Max de Marzi (RageDB and RelationalAI)</td> +<td>RageDB: Building a Graph Database in Anger – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/max-de-marzi-ragedb-building-a-graph-database-in-anger.pdf">slides</a>, <a href="https://youtu.be/LBbF8aslYFE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:30</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>15:30</td> +<td>15:45</td> +<td>Umit Catalyurek (AWS)</td> +<td>HPC Graph Analytics on the OneGraph Model – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/umit-catalyurek-onegraph-hpc.pdf">slides</a>, <a href="https://youtu.be/64tv5LA6Wr8">video</a></td> +</tr> +<tr> +<td>15:50</td> +<td>16:05</td> +<td>David J. Haglin (Trovares)</td> +<td>How LDBC impacts Trovares – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/david-haglin-trovares.pdf">slides</a>, <a href="">video</a></td> +</tr> +<tr> +<td>16:10</td> +<td>16:25</td> +<td>Wenyuan Yu (Alibaba Damo Academy)</td> +<td>GraphScope Flex: A Graph Computing Stack with LEGO-Like Modularity – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/wenyuan-yu-graphscope-flex.pdf">slides</a>, <a href="https://youtu.be/cRikoyDmMks">video</a></td> +</tr> +<tr> +<td>16:30</td> +<td>16:40</td> +<td>Scott McMillan (Carnegie Mellon University)</td> +<td>Graph processing using GraphBLAS – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/scott-mcmillan-graph-processing-using-graphblas.pdf">slides</a>, <a href="https://youtu.be/yb4hGBhUzQQ">video</a></td> +</tr> +<tr> +<td>16:45</td> +<td>16:55</td> +<td>Tim Mattson (Intel)</td> +<td>Graphs (GraphBLAS) and storage (TileDB) as Sparse Linear algebra – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixteenth-tuc-meeting/attachments/tim-mattson-graphblas-and-tiledb.pdf">slides</a></td> +</tr> +<tr> +<td>17:00</td> +<td>20:00</td> +<td><em>happy hour (rooftop grill with beverages)</em></td> +<td><em>on the Nitro South building&rsquo;s 8th floor deck</em></td> +</tr> +</tbody> +</table> +<h4 id="tuc-event-locations">TUC event locations</h4> +<p>A <a href="https://www.google.com/maps/d/u/0/edit?mid=19_fi4fV-3-PZkNWCCcmhU86ct2EZXbgo">map of the LDBC TUC events</a> we hosted so far.</p> + + + + + LDBC SNB – Early 2023 updates + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + Wed, 15 Feb 2023 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-snb-early-2023-updates/ + <p>2023 has been an eventful year for us so far. 
Here is a summary of our recent activities.</p> +<ol> +<li> +<p>Our paper <a href="https://ldbcouncil.org/docs/papers/ldbc-snb-bi-vldb-2022.pdf">The LDBC Social Network Benchmark: Business Intelligence Workload</a> was published in PVLDB.</p> +</li> +<li> +<p>David Püroja just completed his MSc thesis on creating a design towards <a href="https://ldbcouncil.org/docs/papers/msc-thesis-david-puroja-snb-interactive-v2-2023.pdf">SNB Interactive v2</a> at CWI&rsquo;s Database Architectures group. David and I gave a deep-dive talk at the FOSDEM conference&rsquo;s graph developer room titled <a href="https://fosdem.org/2023/schedule/event/graph_ldbc/">The LDBC Social Network Benchmark</a> (<a href="https://www.youtube.com/watch?v=YNF6z6gtXY4">YouTube mirror</a>).</p> +</li> +<li> +<p>I gave a lightning talk at FOSDEM&rsquo;s HPC developer room titled <a href="https://www.youtube.com/watch?v=q26DHnQFw54">The LDBC Benchmark Suite</a> (<a href="https://www.youtube.com/watch?v=q26DHnQFw54">YouTube mirror</a>).</p> +</li> +<li> +<p>Our auditors have successfully benchmark a number of systems:</p> +<ul> +<li>SPB with the Ontotext GraphDB systems for the SF3 and SF5 data sets (auditor: Pjotr Scholtze)</li> +<li>SNB Interactive with the Ontotext GraphDB system for the SF30 data set (auditor: David Püroja)</li> +<li>SNB Interactive with the TuGraph system running in the Aliyun cloud for the SF30, SF100, and SF300 data sets (auditor: Márton Búr)</li> +</ul> +</li> +</ol> +<p>The results and the full disclosure reports are available under the <a href="https://ldbcouncil.org/benchmarks/spb/">SPB</a> and <a href="https://ldbcouncil.org/benchmarks/snb/">SNB benchmark pages</a>.</p> + + + + + LDBC SNB Datagen – The winding path to SF100K + https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/ + Tue, 13 Sep 2022 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-snb-datagen-the-winding-path-to-sf100k/ + <p>LDBC SNB provides a data generator, which produces synthetic datasets, mimicking a social network’s activity during a period of time. Datagen is defined by the charasteristics of realism, scalability, determinism and usability. More than two years have elapsed since my <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">last technical update</a> on LDBC SNB Datagen, in which I discussed the reasons for moving the code to Apache Spark from the MapReduce-based Apache Hadoop implementation and the challenges I faced during the migration. Since then, we reached several goals such as we refactored the serializers to use Spark&rsquo;s high-level writers to support the popular Parquet data format and to enable running on spot nodes; brought back factor generation; implemented support for the novel BI benchmark; and optimized the runtime to generate SF30K on 20 i3.4xlarge machines on AWS.</p> +<h1 id="moving-to-sparksql">Moving to SparkSQL</h1> +<p>We planned to move parts of the code to SparkSQL, an optimized runtime framework for tabular data. We hypothesized that this would benefit us on multiple fronts: SparkSQL offers an efficient batch analytics runtime, with higher level abstractions that are simpler to understand and work with, and we could easily add support for serializing to Parquet based on SparkSQL&rsquo;s capabilites.</p> +<blockquote> +<p>Spark SQL is a Spark module for structured data processing. It provides a programming abstraction called DataFrames and can also act as a distributed SQL query engine. 
Spark SQL includes a cost-based optimizer, columnar storage, and code generation to make queries fast.</p> +</blockquote> +<p>Dealing with the dataset generator proved quite tricky, because it samples from various hand-written distributions and dictionaries, and contains complex domain logic, for which SparkSQL unsuitable. We assessed that the best thing we could do is wrap entire entity generation procedures in UDFs (user defined SQL functions). However, several of these generators return entity trees<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup>, which are spread across multiple tables by the serializer, and these would have needed to be split up. Further complicating matters, we would have also had to find a way to coordinate the inner random generators&rsquo; state between the UDFs to ensure deterministic execution. Weighing these and that we could not find much benefit in SparkSQL, we ultimately decided to leave entity generation as it is. We limited the SparkSQL refactor to the following areas:</p> +<ol> +<li>table manipulations related to shaping the output into the supported layouts and data types as set forth in the specification;</li> +<li>deriving the Interactive and BI datasets;</li> +<li>and generating the factor tables, which contain analytic information, such as population per country, number of friendships between city pairs, number of messages per day, etc., used by the substitution parameter generator to ensure predictable query runtimes.</li> +</ol> +<p>We refer to points (1.) and (2.) collectively as dataset transformation, while (3.) as factor generation. Initially, these had been part of the generator, extracted as part of this refactor, which resulted in cleaner, more maintainable design.</p> +<p><img src="datagen_df_0.png" alt="Datagen stages"></p> +<p>The diagram above shows the components on a high level. The generator outputs a dataset called IR (intermediate representation), which is immediately written to disk. Then, the IR is input to the dataset transformation and factor generation stages, which respectively generate the final dataset and the factor tables. We are aware that spitting out the IR adds considerable runtime overhead and doubles the disk requirements in the worst-case scenario, however, we found that there&rsquo;s no simple way to avoid<br> +it, as the generator produces entity trees, which are incompatible with the flat, tabular, column oriented layout of SparkSQL. On the positive side, this design enables us to reuse the generator output for multiple transformations and add new factor tables without regenerating the data.</p> +<p>I&rsquo;ll skip describing the social network graph dataset generator (i.e. stage 1) in any more detail, apart from its serializer, as that was the only part involved in the current refactor. 
If you are interested in more details, you may look up the <a href="https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/">previous blogpost in the series</a> or the <a href="https://arxiv.org/abs/2001.02299">Interactive benchmark specification</a>.</p> +<h1 id="transformation-pipeline">Transformation pipeline</h1> +<p>The dataset transformation stage sets off where generation finished, and applies an array of pluggable transformations:</p> +<ul> +<li>explodes edges and / or attributes into separate tables,</li> +<li>subsets the snapshot part and creates insert / delete batches for the BI workload,</li> +<li>subsets the snapshot part for the Interactive workload,</li> +<li>applies formatting related options such as date time representation,</li> +<li>serializes the data to a Spark supported format (CSV, Parquet),</li> +</ul> +<p>We utilize a flexible data pipeline that operates on the graph.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span>, <span style="color:#66d9ef">M2</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">]</span> <span style="color:#a6e22e">extends</span> <span style="color:#f92672">(</span><span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">])</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">In</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> apply<span style="color:#f92672">(</span>v<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M1</span><span style="color:#f92672">])</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M2</span><span style="color:#f92672">]</span> <span style="color:#66d9ef">=</span> transform<span 
style="color:#f92672">(</span>v<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>The <code>Transform</code> trait encodes a pure (side effect-free) function polymorphic over graphs, so that transformation pipelines can be expressed with ordinary function composition in a type safe manner. Let&rsquo;s see some of the transformations we have.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToBiTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">BI</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> keepImplicitDeletes<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.BI</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">,</span> simulationStart<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">,</span> simulationEnd<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Long</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Interactive</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span 
style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeEdges</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">???</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Therefore, a transformation pipeline may look like this:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">RawToInteractiveTransform</span><span style="color:#f92672">(</span>params<span style="color:#f92672">,</span> start<span style="color:#f92672">,</span> end<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span 
style="color:#66d9ef">val</span> outputGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>inputGraph<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>The <code>Graph</code> record has a <code>definition</code> field containing graph-global metadata, whereas <code>entities</code> holds the datasets keyed by their entity type. There are 3 graph <em>modes</em> currently: <code>Raw</code>, <code>Interactive</code> and <code>BI</code>. The BI dataset has different layout than the rest, as it contains incremental inserts and deletes for the entities additionally to the bulk snapshot. This is captured in the <code>Layout</code> dependent type, over which the entities are polymorphic.</p> +<p>It&rsquo;s important to understand that <code>Graph</code> holds <code>DataFrame</code>s, and these are lazily computed by Spark. So, <code>Graph</code> is merely a description of transformations used to derive the comprising datasets, which makes them subject to all the SparkSQL fanciness such as query optimization, whole stage code generation, and so on. Processing is delayed until an action (such as a disk write) forces it.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> isAttrExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> isEdgesExploded<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> useTimestamp<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> mode<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">M</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">Option</span><span style="color:#f92672">[</span><span style="color:#66d9ef">String</span><span style="color:#f92672">]]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">+M</span> <span style="color:#66d9ef">&lt;:</span> <span style="color:#66d9ef">Mode</span><span style="color:#f92672">](</span> +</span></span><span style="display:flex;"><span> definition<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">GraphDef</span><span style="color:#f92672">[</span><span style="color:#66d9ef">M</span><span style="color:#f92672">],</span> 
+</span></span><span style="display:flex;"><span> entities<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Map</span><span style="color:#f92672">[</span><span style="color:#66d9ef">EntityType</span>, <span style="color:#66d9ef">M</span><span style="color:#66d9ef">#</span><span style="color:#66d9ef">Layout</span><span style="color:#f92672">]</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">sealed</span> <span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">object</span> <span style="color:#a6e22e">Raw</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">Interactive</span><span style="color:#f92672">(</span>bulkLoadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">DataFrame</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... 
*/</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">final</span> <span style="color:#66d9ef">case</span> <span style="color:#66d9ef">class</span> <span style="color:#a6e22e">BI</span><span style="color:#f92672">(</span>bulkloadPortion<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Double</span><span style="color:#f92672">,</span> batchPeriod<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">String</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Mode</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Layout</span> <span style="color:#f92672">=</span> <span style="color:#a6e22e">BatchedEntity</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* ... */</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>You may notice that <code>Transform</code> is statically typed w.r.t. <code>Mode</code>; however, other properties, like <code>isAttrExploded</code> or <code>isEdgesExploded</code>, are not captured in the type and remain merely dynamic. This makes some nonsensical transformation pipelines (e.g. one that explodes edges twice in a row) syntactically valid. This trade-off in compile-time safety was made to prevent overcomplicating the types.</p> +<p>As we already mentioned, <code>Graph</code> is essentially a persistent container of <code>EntityType -&gt; DataFrame</code> mappings. <code>EntityType</code> can be <code>Node</code>, <code>Edge</code> and <code>Attr</code>, and is used to identify the entity and embellish it with static metadata, such as a descriptive name and primary key, whether it is static or dynamic (as per the specification), and, in the case of edges, the source and destination type and cardinality. This makes it very simple to create transformation rules on static entity properties with pattern matching.</p> +<p>Usually, a graph transformation involves matching entities based on their <code>EntityType</code>, and modifying the mapping (and if required, other metadata).</p>
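+<p>As a minimal sketch of this shape (illustrative only, not a transformation from the datagen codebase; the column name and the <code>copy</code>-based update are assumptions), a transformation that merely drops a column from <code>Person</code> could look like this:</p>
+<div class="highlight"><pre tabindex="0"><code class="language-scala" data-lang="scala">// Illustrative sketch only, not a transformation from the datagen codebase.
+// It matches an entity by its EntityType and replaces its DataFrame in the map;
+// the dropped column and the copy-based update are assumptions.
+object DropPersonEmail extends Transform[Mode.Raw.type, Mode.Raw.type] {
+  override def transform(input: In): Out = {
+    val entities = input.entities.map {
+      case (k @ Node(&#34;Person&#34;, false), df) =&gt; k -&gt; df.drop(&#34;email&#34;)
+      case other                               =&gt; other
+    }
+    input.copy(entities = entities) // Graph is a case class, as shown above
+  }
+}
+</code></pre></div>
+<p>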
Take, for example, the <code>ExplodeAttrs</code> transformation, which explodes into separate tables the values of two columns of <code>Person</code> stored as arrays:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">object</span> <span style="color:#a6e22e">ExplodeAttrs</span> <span style="color:#66d9ef">extends</span> <span style="color:#a6e22e">Transform</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span>, <span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">override</span> <span style="color:#66d9ef">def</span> transform<span style="color:#f92672">(</span>input<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">In</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Out</span> <span style="color:#f92672">=</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">if</span> <span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#75715e">// assert at runtime that the transformation hasn&#39;t been applied yet +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#66d9ef">throw</span> <span style="color:#66d9ef">new</span> <span style="color:#a6e22e">AssertionError</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Attributes already exploded in the input graph&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> explodedAttr<span style="color:#f92672">(</span>attr<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Attr</span><span style="color:#f92672">,</span> node<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">DataFrame</span><span style="color:#f92672">,</span> column<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Column</span><span style="color:#f92672">)</span> <span style="color:#66d9ef">=</span> +</span></span><span style="display:flex;"><span> attr <span style="color:#f92672">-&gt;</span> node<span style="color:#f92672">.</span>select<span style="color:#f92672">(</span>withRawColumns<span style="color:#f92672">(</span>attr<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>parent<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">),</span> explode<span style="color:#f92672">(</span>split<span style="color:#f92672">(</span>column<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;;&#34;</span><span 
style="color:#f92672">)).</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">s&#34;</span><span style="color:#e6db74">${</span>attr<span style="color:#f92672">.</span>attribute<span style="color:#e6db74">}</span><span style="color:#e6db74">Id&#34;</span><span style="color:#f92672">)))</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> modifiedEntities <span style="color:#66d9ef">=</span> input<span style="color:#f92672">.</span>entities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>collect <span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k <span style="color:#66d9ef">@</span> <span style="color:#a6e22e">Node</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person&#34;</span><span style="color:#f92672">,</span> <span style="color:#66d9ef">false</span><span style="color:#f92672">),</span> df<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> <span style="color:#75715e">// match the Person node. This is the only one ExplodeAttrs should modify +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#a6e22e">Map</span><span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Email&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;EmailAddress&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonEmailEmailAddress&#34; entity derived by exploding the email column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> explodedAttr<span style="color:#f92672">(</span><span style="color:#a6e22e">Attr</span><span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Speaks&#34;</span><span style="color:#f92672">,</span> k<span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;Language&#34;</span><span style="color:#f92672">),</span> df<span style="color:#f92672">,</span> $<span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">),</span> <span style="color:#75715e">// add a new &#34;PersonSpeaksLanguage&#34; entity derived by exploding the language column of Person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> k <span style="color:#f92672">-&gt;</span> df<span style="color:#f92672">.</span>drop<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;email&#34;</span><span style="color:#f92672">,</span> <span style="color:#e6db74">&#34;language&#34;</span><span style="color:#f92672">)</span> <span style="color:#75715e">// drop the exploded columns from person +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> 
updatedEntities <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>entities<span style="color:#f92672">)(</span><span style="color:#66d9ef">_</span> <span style="color:#f92672">++</span> <span style="color:#66d9ef">_</span><span style="color:#f92672">)</span> <span style="color:#75715e">// merge-replace the modified entities in the graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> updatedEntityDefinitions <span style="color:#66d9ef">=</span> modifiedEntities +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>foldLeft<span style="color:#f92672">(</span>input<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities<span style="color:#f92672">)</span> <span style="color:#f92672">{</span> <span style="color:#f92672">(</span>e<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> e <span style="color:#f92672">++</span> v<span style="color:#f92672">.</span>map<span style="color:#f92672">{</span> <span style="color:#66d9ef">case</span> <span style="color:#f92672">(</span>k<span style="color:#f92672">,</span> v<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> k <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Some</span><span style="color:#f92672">(</span>v<span style="color:#f92672">.</span>schema<span style="color:#f92672">.</span>toDDL<span style="color:#f92672">)</span> <span style="color:#f92672">}</span> <span style="color:#75715e">// update the entity definition schema to reflect the modifications +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> l <span style="color:#66d9ef">=</span> lens<span style="color:#f92672">[</span><span style="color:#66d9ef">In</span><span style="color:#f92672">]</span> <span style="color:#75715e">// lenses provide a terse syntax for modifying nested fields +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">(</span>l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>isAttrExploded <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>definition<span style="color:#f92672">.</span>entities <span style="color:#f92672">~</span> l<span style="color:#f92672">.</span>entities<span style="color:#f92672">).</span>set<span style="color:#f92672">(</span>input<span style="color:#f92672">)((</span><span style="color:#66d9ef">true</span><span style="color:#f92672">,</span> updatedEntityDefinitions<span style="color:#f92672">,</span> updatedEntities<span style="color:#f92672">))</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">}</span> +</span></span></code></pre></div><p>Note that <code>EntityType</code> does not hold the dataset&rsquo;s full SQL schema currently, as it&rsquo;s not useful for pattern matching, but can be accessed 
directly from <code>DataFrame</code> if needed.</p> +<h1 id="inputoutput">Input/output</h1> +<p>The <code>Reader</code> and <code>Writer</code> typeclasses are used to read from a <code>Source</code> and write to a <code>Sink</code> respectively, terminating a graph transformation pipeline<br> +on both ends.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">T</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> read<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Ret</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> exists<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">T</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Boolean</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">trait</span> <span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">S</span><span style="color:#f92672">]</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">type</span> <span style="color:#66d9ef">Data</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">def</span> write<span style="color:#f92672">(</span>self<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Data</span><span style="color:#f92672">,</span> sink<span style="color:#66d9ef">:</span> <span style="color:#66d9ef">S</span><span style="color:#f92672">)</span><span style="color:#66d9ef">:</span> <span style="color:#66d9ef">Unit</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">}</span> +</span></span></code></pre></div><p>There are implementations under <code>ldbc.datagen.io.instances</code> that read a graph from a <code>GraphSource</code> and write to a <code>GraphSink</code>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span 
style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> source <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Reader</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSource</span>, <span style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>read<span style="color:#f92672">(</span>source<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transform <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">ExplodeAttrs</span><span style="color:#f92672">.</span>andThen<span style="color:#f92672">(</span><span style="color:#a6e22e">ExplodeEdges</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> transform<span style="color:#f92672">(</span>graph<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// write +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> sink <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">Writer</span><span style="color:#f92672">[</span><span style="color:#66d9ef">GraphSink</span>, <span 
style="color:#66d9ef">Graph</span><span style="color:#f92672">[</span><span style="color:#66d9ef">Mode.Raw.</span><span style="color:#66d9ef">type</span><span style="color:#f92672">]].</span>write<span style="color:#f92672">(</span>transformedGraph<span style="color:#f92672">,</span> sink<span style="color:#f92672">)</span> +</span></span></code></pre></div><p>We provide <a href="https://github.com/typelevel/simulacrum">Ops syntax</a> to make it shorter:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.model.Mode +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.graphs.<span style="color:#f92672">{</span><span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">}</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.instances._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Reader.ops._ +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">import</span> ldbc.snb.datagen.io.Writer.ops._ +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// read +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> inputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/input/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> inputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;parquet&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> graph <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">GraphSource</span><span style="color:#f92672">(</span>model<span style="color:#f92672">.</span>graphs<span style="color:#f92672">.</span><span style="color:#a6e22e">Raw</span><span style="color:#f92672">.</span>graphDef<span style="color:#f92672">,</span> inputPath<span style="color:#f92672">,</span> inputFormat<span style="color:#f92672">).</span>read +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// transform +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> transformedGraph <span style="color:#66d9ef">=</span> <span style="color:#f92672">???</span> <span style="color:#75715e">/* ... 
*/</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// write +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span><span style="color:#66d9ef">val</span> outputPath <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;path/to/output/graph&#34;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">val</span> outputFormat <span style="color:#66d9ef">=</span> <span style="color:#e6db74">&#34;csv&#34;</span> +</span></span><span style="display:flex;"><span>transformedGraph<span style="color:#f92672">.</span>write<span style="color:#f92672">(</span><span style="color:#a6e22e">GraphSink</span><span style="color:#f92672">(</span>outputPath<span style="color:#f92672">,</span> outputFormat<span style="color:#f92672">))</span> +</span></span></code></pre></div><p>The reader/writer architecture is layered: the graph reader/writer uses dataframe readers/writers for each of its entities. One interesting aspect of implementing the reader was dealing with the input schema. Parquet is self-describing; however, as we also support the CSV format, we had to provide a way for correct schema detection and column parsing.</p> +<p>Spark has a facility to derive SparkSQL schema from case classes automatically<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup>. We created case classes for each entity in the <code>Raw</code> dataset. We also created a typeclass <code>EntityTraits</code> associating these classes with their <code>EntityType</code>, so we can summon them (and consequently their SparkSQL schema) in the reader.</p> +<p>The case classes are used during the serialization of the generated dataset too, but more about that later.</p> +<h1 id="factor-generation">Factor generation</h1> +<p>As we already mentioned, factor generation was originally part of the data generator, i.e. factor tables were calculated on the fly and emitted as side outputs. This design had some problems. Auxiliary data structures had to be maintained and interleaved with generation, which violated separation of concerns, consequently hurting readability and maintainability. Also, anything more complicated than entity-local aggregates was impossible to express in the original MapReduce framework. To keep the preceding Spark rewrite at a manageable scope, the original factor generation code had been removed.</p> +<p>We decided it&rsquo;s best to reintroduce factor generation as a post-processing step that operates on the generated data. This makes it possible to express more complex analytical queries, requires no prior knowledge about the generator, can be done in SparkSQL (making it much simpler), and removes the impact on the generator&rsquo;s performance, so that we can optimize them separately. Since this refactor, we almost tripled the number of factor tables (up to 31, covering both SNB workloads, BI and Interactive). The queries computing certain factor tables even use <a href="https://spark.apache.org/graphx/">GraphX</a>, which was unimaginable with the previous design.</p> +<p>Factor tables are added by extending a map with a <code>name -&gt; Factor</code> pair.</p>
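+<p>The exact constructor is an implementation detail of the datagen; as a rough sketch inferred from the example further below (an assumption, not the actual definition), a <code>Factor</code> entry has roughly this shape:</p>
+<div class="highlight"><pre tabindex="0"><code class="language-scala" data-lang="scala">import org.apache.spark.sql.DataFrame
+
+// Rough sketch of the shape implied by the usage below (EntityType comes from the
+// datagen model shown earlier); the real definition in the codebase may differ.
+case class Factor(requiredEntities: EntityType*)(f: Seq[DataFrame] =&gt; DataFrame)
+    extends (Seq[DataFrame] =&gt; DataFrame) {
+  override def apply(inputs: Seq[DataFrame]): DataFrame = f(inputs)
+}
+</code></pre></div>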
+<p><code>Factor</code> declares its input entities, and accepts a function that receives the input <code>DataFrame</code>s and returns a single <code>DataFrame</code> as output.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-scala" data-lang="scala"><span style="display:flex;"><span><span style="color:#66d9ef">val</span> factors <span style="color:#66d9ef">=</span> <span style="color:#a6e22e">Map</span> <span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;personDisjointEmployerPairs&#34;</span> <span style="color:#f92672">-&gt;</span> <span style="color:#a6e22e">Factor</span><span style="color:#f92672">(</span><span style="color:#a6e22e">PersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonKnowsPersonType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">OrganisationType</span><span style="color:#f92672">,</span> <span style="color:#a6e22e">PersonWorkAtCompanyType</span><span style="color:#f92672">)</span> <span style="color:#f92672">{</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">case</span> <span style="color:#a6e22e">Seq</span><span style="color:#f92672">(</span>person<span style="color:#f92672">,</span> personKnowsPerson<span style="color:#f92672">,</span> organisation<span style="color:#f92672">,</span> workAt<span style="color:#f92672">)</span> <span style="color:#66d9ef">=&gt;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> knows <span style="color:#66d9ef">=</span> undirectedKnows<span style="color:#f92672">(</span>personKnowsPerson<span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> company <span style="color:#66d9ef">=</span> organisation<span style="color:#f92672">.</span>where<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;Type&#34;</span> <span style="color:#f92672">===</span> <span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">).</span>cache<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">val</span> personSample <span style="color:#66d9ef">=</span> person +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>orderBy<span style="color:#f92672">(</span>$<span style="color:#e6db74">&#34;id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>limit<span style="color:#f92672">(</span><span style="color:#ae81ff">20</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> personSample +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Person2&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>knows<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;knows&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;knows.person2Id&#34;</span> <span style="color:#f92672">===</span> $<span
style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>workAt<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;workAt&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;workAt.PersonId&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;knows.Person1id&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>join<span style="color:#f92672">(</span>company<span style="color:#f92672">.</span>as<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;Company&#34;</span><span style="color:#f92672">),</span> $<span style="color:#e6db74">&#34;Company.id&#34;</span> <span style="color:#f92672">===</span> $<span style="color:#e6db74">&#34;workAt.CompanyId&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>select<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2id&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.name&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyName&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Company.id&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;companyId&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.creationDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2creationDate&#34;</span><span style="color:#f92672">),</span> +</span></span><span style="display:flex;"><span> $<span style="color:#e6db74">&#34;Person2.deletionDate&#34;</span><span style="color:#f92672">.</span>alias<span style="color:#f92672">(</span><span style="color:#e6db74">&#34;person2deletionDate&#34;</span><span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">)</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span>distinct<span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">},</span> +</span></span><span style="display:flex;"><span> <span style="color:#75715e">/* more factors */</span> +</span></span><span style="display:flex;"><span><span style="color:#f92672">)</span> +</span></span></code></pre></div><p>As you can see, it&rsquo;s not much complicated than using plain SQL, with the added benefit of being able to extract recurring subqueries to functions (e.g. <code>undirectedKnows</code>). Currently, there&rsquo;s no parallelization between different factor tables (although each of them is parallelized internally by Spark). 
+<p>The Factor table writer uses the same componentized architecture as the graph writer, i.e. it uses the dataframe writer under the hood.</p> +<h1 id="revamping-the-data-generators-serializer">Revamping the data generator&rsquo;s serializer</h1> +<p>At this point, both the transformation pipeline and the factor generator were ready; however, the data generator was still chugging along with the old serializer, emitting the IR in CSV. We wanted to move this to Parquet to improve performance and reduce its size, but there was a problem: due to the generator&rsquo;s custom data representation, SparkSQL (and its DataSource API) was off-limits. So we bit the bullet and rewrote the existing serializer to emit Parquet.</p> +<blockquote> +<p><a href="https://parquet.apache.org/">Parquet</a> is an open source data format that evolved to be the de facto standard for Big Data batch pipelines. It offers a column-oriented, compressed, schemaful representation that is space-efficient and suited for analytic queries. The file format leverages a record shredding and assembly model, which originated at Google. This results in a file that is optimized for query performance and minimizing I/O.</p> +</blockquote> +<p>The new serialization framework is heavily influenced by the design of Java <code>OutputStreams</code>, in the sense that stateful objects are composed to form a pipeline. For example, in the case of <em>activities</em>, the input is an activity tree, and the output is a set of rows in multiple files (e.g. forum, forumHasTag, post, postHasTag, etc.). The components that take part in activity serialization are shown in the diagram below. The activity tree is iterated (1st component) and the corresponding entity serializer is called (2nd component), which is fed into a component that splits the records (3rd one) among several output streams writing individual files (last).</p> +<p><img src="activity.png" alt="Activity serialization pipeline"></p> +<p>The benefit of this architecture is that only the last component needs to change when we add support for a new output format.</p> +<p>To support Parquet, we made use of row-level serializers available in Hadoop&rsquo;s Parquet library (bundled with SparkSQL), and internal classes in SparkSQL to derive the Parquet schema for our entities. Remember how we used case classes for the <code>Raw</code> entities to derive the input schema in the graph reader during dataset transformation? Here we use the same classes (e.g. <code>Forum</code>) and Spark&rsquo;s <code>Encoder</code> framework to encode the entities in Parquet, which means that the generated output remains consistent with the <code>DataFrame</code>-based reader, and we spare a lot of code duplication.</p> +<h1 id="optimizations">Optimizations</h1> +<p>After these refactors, we were able to generate the BI dataset with scale factor 10K on 300 i3.4xlarge machines in one hour. Decreasing the number of machines resulted in out-of-memory errors in the generator. We realized partition sizes (and thus the number of partitions) should be determined based on available memory. Our experiments showed that a machine with 128GB of memory is capable of generating SF3K (scale factor 3000) reliably with 3 blocks<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> per partition, given ample disk size to allow for spills (tested with 3.8TB); fewer partitions (and consequently a larger block/partition ratio) would introduce OOM errors.
Furthermore, we split the data generator output after a certain number of rows written, to guard against the skew between different kinds of entities causing problems during transformation<sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup>. These optimizations enabled us to run SF10K reliably on 4 i3.4xlarge machines in 11 hours (which is still more than a 6x reduction in cost). We weren&rsquo;t able to run SF30K on 10 machines (1 machine per SF3K); even 15 machines ran out of disk. This non-linear disk use should be investigated further as it complicates calculating cluster sizes for larger scale factors.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf3k_bi <span style="color:#ae81ff">3000</span> parquet bi <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">330</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs +</span></span></code></pre></div><div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>./tools/emr/submit_datagen_job.py sf10k_bi <span style="color:#ae81ff">10000</span> parquet bi <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --sf-per-executor <span style="color:#ae81ff">3000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --partitions <span style="color:#ae81ff">1000</span> <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --jar $JAR_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --instance-type i3.4xlarge <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> --bucket $BUCKET_NAME <span style="color:#ae81ff">\ +</span></span></span><span style="display:flex;"><span><span style="color:#ae81ff"></span> -- --explode-edges --explode-attrs +</span></span></code></pre></div><p>The above examples show working configurations for generating the 3K and 10K BI datasets. The <code>--sf-per-executor</code> option controls the number of worker nodes allocated, in this case one node for every 3000 SF, i.e. 1 and 4 nodes respectively. 
The <code>--partitions</code> option controls the total number of partitions, and was calculated based on the number of persons using the formula <code>partitions = ceil(number_of_persons / block_size / 3)</code> to get a maximum of 3 blocks per partition.</p> +<h1 id="conclusion">Conclusion</h1> +<p>These improvements made LDBC SNB datagen more modular, maintainable and efficient, costing under a cent per scale factor to generate the BI dataset, which enables us to generate datasets beyond SF 100K.</p> +<h1 id="footnotes">Footnotes</h1> +<div class="footnotes" role="doc-endnotes"> +<hr> +<ol> +<li id="fn:1"> +<p>The generator produces hierarchies, such as a forum wall with a random number of posts that have comments, etc. This tree is iterated, and different entities are written to separate files.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:2"> +<p>Shameless plug: You can learn more about this from <a href="https://www.dataversity.net/case-study-deriving-spark-encoders-and-schemas-using-implicits/">another blogpost of mine</a>.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:3"> +<p>The data generator produces blocks of 10,000 persons and their related entities. Entities from different blocks are unrelated (isolated).&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:4"> +<p>The maximum row count per file is currently 10M; however, this can be modified with a command line option. We also had an alternative design in mind where this number would have been determined based on the average row size of each entity, however, we stayed with the first version for simplicity.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +</ol> +</div> + + + + + Fifteenth TUC Meeting + https://ldbcouncil.org/event/fifteenth-tuc-meeting/ + Fri, 17 Jun 2022 09:20:00 -0500 + + https://ldbcouncil.org/event/fifteenth-tuc-meeting/ + <p><strong>Organizers:</strong> Gábor Szárnyas, Jack Waudby, Peter Boncz, Alastair Green</p> +<p>LDBC is hosting a <strong>two-day</strong> hybrid workshop, co-located with <a href="https://2022.sigmod.org/venue.shtml">SIGMOD 2022</a> on <strong>June 17-18 (Friday-Saturday)</strong>.</p> +<p>The program consists of 10-15 minute talks followed by a Q&amp;A session. The talks will be recorded and made available online.<br> +The tentative program is the following. 
<strong>All times are in EDT.</strong></p> +<p>We will have a social event on Friday at 17:30 at <a href="https://elvezrestaurant.com/">El Vez</a> (<a href="https://g.page/ElVezPhilly">Google Maps</a>).</p> +<h4 id="friday-pennsylvania-convention-centerhttpswwwpaconventioncom-room-204bhttps2022sigmodorgprogramshtml">Friday (<a href="https://www.paconvention.com/">Pennsylvania Convention Center</a>, <a href="https://2022.sigmod.org/program.shtml">room 204B</a>)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>09:20</td> +<td>09:30</td> +<td>Peter Boncz (LDBC/CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a>, <a href="https://youtu.be/39BoOIGk9Is">video</a></td> +</tr> +<tr> +<td>09:30</td> +<td>09:45</td> +<td>Alastair Green (LDBC/Birkbeck)</td> +<td>LDBC&rsquo;s fair use policies – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-fair-use-of-the-ldbc-trademark.pdf">slides</a>, <a href="https://youtu.be/7zmCysN4Rpg">video</a></td> +</tr> +<tr> +<td>09:50</td> +<td>10:05</td> +<td>Gábor Szárnyas (LDBC/CWI), Jack Waudby (Newcastle University)</td> +<td>LDBC Social Network Benchmark: Business Intelligence workload v1.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/gabor-szarnyas-the-ldbc-social-network-benchmark-business-intelligence-workload.pdf">slides</a>, <a href="https://youtu.be/AJ96M8_njxE">video</a></td> +</tr> +<tr> +<td>10:10</td> +<td>10:25</td> +<td>Heng Lin (Ant Group)</td> +<td>LDBC Financial Benchmark introduction – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/heng-lin-ldbc-financial-benchmark-introduction.pdf">slides</a>, <a href="https://youtu.be/iBhud_YjafY">video</a></td> +</tr> +<tr> +<td>10:30</td> +<td>11:00</td> +<td><em>coffee break</em></td> +<td></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Chen Zhang (CreateLink)</td> +<td>New LDBC SNB benchmark record by Galaxybase: More than 6 times faster and 70% higher throughput – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/chen-zhang-new-ldbc-snb-benchmark-record-by-galaxybase-more-than-6-times-faster-and-70-percent-higher-throughput.pdf">slides</a>, <a href="https://youtu.be/sMzTsb8iw_Y">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>James Clarkson (Neo4j)</td> +<td>LDBC benchmarks: Promoting good science and industrial consumption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/james-clarkson-ldbc-benchmarks-promoting-good-science-and-industrial-consumption.pdf">slides</a>, <a href="https://youtu.be/VYG1mzcl9qQ">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Oskar van Rest (Oracle)</td> +<td>Creating and querying property graphs in Oracle, on-premise and in the cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oskar-van-rest-creating-and-querying-property-graphs-in-oracle-on-premise-and-in-the-cloud.pdf">slides</a>, <a href="https://youtu.be/2HX2Vixf2gs">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>12:15</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>Conquering LDBC SNB BI at SF-10k – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/mingxi-wu-conquering-ldbc-snb-bi-at-sf10k.pdf">slides</a>, <a href="https://youtu.be/oJbqzQ_t3G8">video</a></td> +</tr> +<tr> +<td>12:20</td> +<td>13:20</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:20</td> +<td>13:35</td> +<td>Altan Birler (Technische Universität München)</td> +<td>Relational databases can handle graphs too! Experiences with optimizing the Umbra RDBMS for LDBC SNB BI – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/altan-birler-relational-databases-can-handle-graphs-too.pdf">slides</a>, <a href="https://youtu.be/cRgbdY3I2i4">video</a></td> +</tr> +<tr> +<td>13:40</td> +<td>13:55</td> +<td>David Püroja (CWI)</td> +<td>LDBC Social Network Benchmark: Interactive workload v2.0 – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/david-puroja-ldbc-snb-interactive-workload-v2.0.pdf">slides</a></td> +</tr> +<tr> +<td>14:00</td> +<td>14:15</td> +<td>Angela Bonifati (Lyon 1 University)</td> +<td>The quest for schemas in graph databases – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/angela-bonifati-the-quest-for-schemas-in-graph-databases.pdf">slides</a>, <a href="https://youtu.be/VT7cx3Jp7V8">video</a></td> +</tr> +<tr> +<td>14:20</td> +<td>14:35</td> +<td>Matteo Lissandrini (Aalborg University)</td> +<td>Understanding graph data representations in triplestores – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/matteo-lissandrini-understanding-graph-data-representations-in-triplestores.pdf">slides</a>, <a href="https://youtu.be/xqVMJZfh_JU">video</a></td> +</tr> +<tr> +<td>14:40</td> +<td>14:55</td> +<td>Wim Martens (University of Bayreuth)</td> +<td>Path representations – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/wim-martens-path-representations.pdf">slides</a>, <a href="https://youtu.be/Ma-E5dwgf-E">video</a></td> +</tr> +<tr> +<td>15:00</td> +<td>15:20</td> +<td>Audrey Cheng (UC Berkeley)</td> +<td>TAOBench: An end-to-end benchmark for social network workloads – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/audrey-cheng-taobench.pdf">slides</a>, <a href="https://youtu.be/1p8AStxS3es">video</a></td> +</tr> +</tbody> +</table> +<h4 id="saturday-philadelphia-marriott-downtownhttpswwwmarriottcomen-ushotelsphldt-philadelphia-marriott-downtown-room-401-402-4th-floor">Saturday (<a href="https://www.marriott.com/en-us/hotels/phldt-philadelphia-marriott-downtown/">Philadelphia Marriott Downtown</a>, room 401-402, 4th floor)</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>finish</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>10:00</td> +<td>10:15</td> +<td>Keith Hare (WG3)</td> +<td>An update on the GQL &amp; SQL/PGQ standards efforts – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/keith-hare-property-graph-standards-process-and-timing.pdf">slides</a>, <a href="https://youtu.be/xFVD3LWnKlc">video</a></td> +</tr> +<tr> +<td>10:20</td> +<td>10:35</td> +<td>Leonid Libkin (ENS Paris)</td> +<td>Pattern matching in GQL and SQL/PGQ – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/leonid-libkin-pattern-matching-in-gql-and-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/OvGsa0qLANE">video</a></td> +</tr> +<tr> +<td>10:40</td> +<td>10:55</td> +<td>Petra Selmer (Neo4j/WG3)</td> +<td>An overview of GQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/petra-selmer-towards-gql-v1-a-property-graph-query-language-standard.pdf">slides</a>, <a href="https://youtu.be/tncf2FgyIyo">video</a></td> +</tr> +<tr> +<td>11:00</td> +<td>11:15</td> +<td>Alastair Green (LDBC/WG3)</td> +<td>GQL 2.0: A technical manifesto – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/alastair-green-gql-2.0-a-technical-manifesto.pdf">slides</a>, <a href="https://youtu.be/upIvpYy8C2g">video</a></td> +</tr> +<tr> +<td>11:20</td> +<td>11:35</td> +<td>George Fletcher (TU Eindhoven)</td> +<td>PG-Keys (LDBC Property Graph Schema Working Group) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/george-fletcher-pg-keys-keys-for-property-graphs.pdf">slides</a>, <a href="https://youtu.be/_W8-jOtcObc">video</a></td> +</tr> +<tr> +<td>11:40</td> +<td>11:55</td> +<td>Arvind Shyamsundar (Microsoft)</td> +<td>Graph capabilities in Microsoft SQL Server and Azure SQL Database – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/arvind-shyamsundar-graph-capabilities-in-microsoft-sql-server-and-azure-database.pdf">slides</a>, <a href="https://youtu.be/xxV2BfZupGw">video</a></td> +</tr> +<tr> +<td>12:00</td> +<td>13:30</td> +<td><em>lunch (on your own)</em></td> +<td></td> +</tr> +<tr> +<td>13:30</td> +<td>13:45</td> +<td>Daniël ten Wolde (CWI)</td> +<td>Implementing SQL/PGQ in DuckDB – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/daniel-ten-wolde-implementing-sql-pgq-in-duckdb.pdf">slides</a>, <a href="https://youtu.be/JmSfU0BTH5w">video</a></td> +</tr> +<tr> +<td>13:50</td> +<td>14:05</td> +<td>Oszkár Semeráth, Kristóf Marussy (TU Budapest)</td> +<td>Generation techniques for consistent, realistic, diverse, and scalable graphs – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/oszkar-semerath-generation-techniques-for-consistent-realistic-diverse-and-scalable-graphs.pdf">slides</a>, <a href="https://youtu.be/hB6j6mvh-vA">video</a></td> +</tr> +<tr> +<td>14:10</td> +<td>14:25</td> +<td>Molham Aref (RelationalAI)</td> +<td>Graph Normal Form – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/molham-aref-graph-normal-form.pdf">slides</a>, <a href="https://youtu.be/-kP4Raqr5KA">video</a></td> +</tr> +<tr> +<td>14:30</td> +<td>14:45</td> +<td>Naomi Arnold (Queen Mary University of London)</td> +<td>Temporal graph analysis of the far-right social network Gab – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/naomi-arnold-temporal-graph-analysis-of-the-far-right-social-network-gab.pdf">slides</a>, <a href="https://youtu.be/ugSkFlif4PE">video</a></td> +</tr> +<tr> +<td>14:50</td> +<td>15:05</td> +<td>Domagoj Vrgoč (PUC Chile)</td> +<td>Evaluating path queries in MillenniumDB – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/domagoj-vrgoc-regular-path-queries-in-millenniumdb.pdf">slides</a>, <a href="https://youtu.be/_OzJ6vI7GNU">video</a></td> +</tr> +<tr> +<td>15:10</td> +<td>15:25</td> +<td>Pavel Klinov, Evren Sirin (Stardog)</td> +<td>Stardog&rsquo;s experience with LDBC – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifteenth-tuc-meeting/attachments/evren-sirin-stardog-experience-with-ldbc.pdf">slides</a>, <a href="https://youtu.be/CBrEeOTqGKM">video</a></td> +</tr> +</tbody> +</table> + + + + + Announcing the LDBC Financial Benchmark Task Force + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + Thu, 26 May 2022 00:00:00 +0000 + + https://ldbcouncil.org/post/announcing-the-ldbc-financial-benchmark-task-force/ + <p>We are delighted to announce the set up of the <a href="https://ldbcouncil.org/benchmarks/finbench/">Financial Benchmark (FinBench) task force</a>.</p> +<p>The Financial Benchmark (FinBench) project aims to define a graph database evaluating benchmark and develop a data generation process and a query driver to make the evaluation of the graph database representative, reliable and comparable, especially in financial scenarios, such as anti-fraud and risk control. The FinBench is scheduled to be released in the end of 2022.</p> +<p>Compared to LDBC SNB, the FinBench will differ in application scenarios, data patterns, and workloads, resulting in different schema characteristics, latency bounds, path filters, etc. FinBench is going to redesign the data pattern and workloads, including the data generation, the query driver, and also some other facilities referred to LDBC SNB.</p> +<p>The FinBench Task Force was approved by LDBC on May 16, 2022. The FinBench Task Force is led by Ant Group, and the initial members also include Pometry, Create Link, StarGraph, Ultipa, Katana, Intel, Memgraph (observer) and Koji Annoura (individual member). See the <a href="https://ldbcouncil.org/benchmarks/finbench/ldbc-finbench-work-charter.pdf">Work Charter for FinBench</a></p> +<p>If you are interested in joining FinBench Task Force, please reach out at info at ldbcouncil.org or guozhihui.gzh at antgroup.com.</p> + + + + + Fourteenth TUC Meeting + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + Mon, 16 Aug 2021 16:00:00 +0200 + + https://ldbcouncil.org/event/fourteenth-tuc-meeting/ + <p>LDBC was hosting a one-day hybrid workshop, co-located with <a href="https://vldb.org/2021/">VLDB 2021</a> on <strong>August 16 (Monday) between 16:00–20:00 CEST</strong>.</p> +<p>The physical part of the workshop was held in room Akvariet 2 of the <a href="https://www.tivolihotel.com/">Tivoli Hotel</a> (Copenhagen), while the virtual part was hosted on Zoom. Our programme consisted of talks that provide an overview of LDBC&rsquo;s recent efforts. Moreover, we have invited industry practitioners and academic researchers to present their latest results.</p> +<p>Talks were scheduled to be 10 minutes with a short Q&amp;A session. We had three sessions. 
Their schedules are shown below.</p> +<h4 id="16001725-cest-ldbc-updates-benchmarks-query-languages">[16:00–17:25 CEST] LDBC updates, benchmarks, query languages</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>16:00</td> +<td>Peter Boncz (CWI)</td> +<td>State of the union – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/peter-boncz-state-of-the-union.pdf">slides</a></td> +</tr> +<tr> +<td>16:05</td> +<td>Gábor Szárnyas (CWI)</td> +<td>Overview of LDBC benchmarks – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/gabor-szarnyas-ldbc-benchmarks.pdf">slides</a></td> +</tr> +<tr> +<td>16:12</td> +<td>Mingxi Wu (TigerGraph)</td> +<td>LDBC Social Network Benchmark results with TigerGraph – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mingxi-wu-tigergraph-snb-preliminary-results.pdf">slides</a></td> +</tr> +<tr> +<td>16:24</td> +<td>Xiaowei Zhu (Ant Group)</td> +<td>Financial Benchmark proposal – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/xiaowei-zhu-financial-benchmark.pdf">slides</a></td> +</tr> +<tr> +<td>16:36</td> +<td>Petra Selmer (Neo4j)</td> +<td>Status report from the Existing Languages Working Group (ELWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/petra-selmer-elwg.pdf">slides</a>, <a href="https://youtu.be/I5A8VuFDhsA">video</a></td> +</tr> +<tr> +<td>16:48</td> +<td>Jan Hidders (Birkbeck)</td> +<td>Status report from the Property Graph Schema Working Group (PGSWG) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/jan-hidders-pgswg.pdf">slides</a>, <a href="https://youtu.be/iEbVi9T-HVk">video</a></td> +</tr> +<tr> +<td>17:00</td> +<td>Keith Hare (JCC Consulting)</td> +<td>Database Language Standards Structure and Process, SQL/PGQ – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/keith-hare-database-language-standards-structure-and-process-sql-pgq.pdf">slides</a>, <a href="https://youtu.be/ZgFCuzods4g">video</a></td> +</tr> +<tr> +<td>17:12</td> +<td>Stefan Plantikow (GQL Editor)</td> +<td>Report on the GQL standard – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/stefan-plantikow-gql.pdf">slides</a>, <a href="https://youtu.be/z0pN5NwKsgc">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="17351845-cest-systems-and-data-structures">[17:35–18:45 CEST] Systems and data structures</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>17:35</td> +<td>Vasileios Trigonakis (Oracle Labs)</td> +<td>PGX.D aDFS: An Almost Depth-First-Search Distributed Graph-Querying System – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasileios-trigonakis-pgxd-adfs.pdf">slides</a>, <a href="https://youtu.be/cv2ZfWRBOek">video</a></td> +</tr> +<tr> +<td>17:47</td> +<td>Matthias Hauck (SAP)</td> +<td>JSON, Spatial, Graph – Multi-model Workloads with SAP HANA Cloud – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/matthias-hauck-json-spatial-graph-sap-hana-cloud.pdf">slides</a>, <a 
href="https://youtu.be/dgpMJFho6Q8">video</a></td> +</tr> +<tr> +<td>17:59</td> +<td>Nikolay Yakovets (Eindhoven University of Technology)</td> +<td>AvantGraph – <a href="https://youtu.be/z0pN5NwKsgcttachments/nikolay-yakovets-avantgraph.pdf">slides</a>, <a href="https://youtu.be/9M9FOycovTw">video</a></td> +</tr> +<tr> +<td>18:11</td> +<td>Semih Salihoglu (University of Waterloo)</td> +<td>GRainDB: Making RDBMSs Efficient on Graph Workloads Through Predefined Joins – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semih-salihoglu-graindb.pdf">slides</a>, <a href="https://youtu.be/FFK3y6vPHJs">video</a></td> +</tr> +<tr> +<td>18:23</td> +<td>Semyon Grigorev (Saint Petersburg University)</td> +<td>Context-free path querying: Obstacles on the way to adoption – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/semyon-grigorev-cfpq.pdf">slides</a>, <a href="https://youtu.be/pha1xIpEL3I">video</a></td> +</tr> +<tr> +<td>18:35</td> +<td>Per Fuchs (Technical University of Munich)</td> +<td>Sortledton: A universal, transactional graph data structure – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/per-fuchs-sortledton.pdf">slides</a>, <a href="https://youtu.be/33ZjsNN0hhU">video</a></td> +</tr> +</tbody> +</table> +<p><em>coffee break (10 minutes)</em></p> +<h4 id="1855-2000-cest-high-level-approaches-and-benchmarks">[18:55-20:00 CEST] High-level approaches and benchmarks</h4> +<table> +<thead> +<tr> +<th>start</th> +<th>speaker</th> +<th>title</th> +</tr> +</thead> +<tbody> +<tr> +<td>18:55</td> +<td>Angelos-Christos Anadiotis (Ecole Polytechnique and Institut Polytechnique de Paris)</td> +<td>Empowering Investigative Journalism with Graph-based Heterogeneous Data Management – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/angelos-christos-anadiotis-investigative-journalism-graph-data-management.pdf">slides</a>, <a href="https://youtu.be/a1VYjyec8dg">video</a></td> +</tr> +<tr> +<td>19:07</td> +<td>Vasia Kalavri (Boston University)</td> +<td>Learning to partition unbounded graph streams – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/vasia-kalavri-learning-to-partition-unbounded-graph-streams.pdf">slides</a>, <a href="https://youtu.be/PTlUABKWniA">video</a></td> +</tr> +<tr> +<td>19:19</td> +<td>Muhammad Attahir Jibril (TU Ilmenau)</td> +<td>Towards a Hybrid OLTP-OLAP Graph Benchmark – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/muhammad-attahir-jibril-hybrid-oltp-olap-benchmark.pdf">slides</a>, <a href="https://youtu.be/tMBVszTSJXc">video</a></td> +</tr> +<tr> +<td>19:31</td> +<td>Riccardo Tommasini (University of Tartu)</td> +<td>An outlook on Benchmarks for Graph Stream Processing – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/riccardo-tommasini-graph-stream-processing-benchmarks.pdf">slides</a>, <a href="https://youtu.be/HabvJvPXsLc">video</a></td> +</tr> +<tr> +<td>19:43</td> +<td>Mohamed Ragab (University of Tartu)</td> +<td>Benchranking: Towards prescriptive analysis of big graph processing: the case of SparkSQL – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourteenth-tuc-meeting/attachments/mohamed-ragab-benchranking.pdf">slides</a>, <a href="https://youtu.be/mZ8LhGUq7Wg">video</a></td> 
+</tr>
+</tbody>
+</table>
+
+    
+    
+    
+      Thirteenth TUC Meeting
+      https://ldbcouncil.org/event/thirteenth-tuc-meeting/
+      Tue, 30 Jun 2020 14:00:00 +0000
+      
+      https://ldbcouncil.org/event/thirteenth-tuc-meeting/
+      <p>LDBC is pleased to announce its Thirteenth Technical User Community (TUC) meeting.</p>
+<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry – LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p>
+<p>This TUC meeting will be a two-day event hosted online. We welcome all users of RDF and Graph technologies to attend. If you are interested in attending the event, please contact Gabor Szarnyas (BME) to register.</p>
+<h3 id="snb-task-force">SNB Task Force</h3>
+<ul>
+<li>Progress report
+<ul>
+<li>ACID compliance test suite</li>
+<li>Integrating deletions to Datagen</li>
+<li>Migrating Datagen to Spark</li>
+<li>Redesign of BI read queries</li>
+<li>Extensions to the driver</li>
+</ul>
+</li>
+<li>Ongoing work
+<ul>
+<li>Datagen: tuning the distribution of deletes</li>
+<li>Interactive 2.0 workload</li>
+<li>BI 1.0 workload</li>
+</ul>
+</li>
+</ul>
+<p>Zoom links will be sent through email.</p>
+
+    
+    
+    
+      Speeding Up LDBC SNB Datagen
+      https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/
+      Fri, 12 Jun 2020 00:00:00 +0000
+      
+      https://ldbcouncil.org/post/speeding-up-ldbc-snb-datagen/
+      <p>LDBC&rsquo;s <a href="#references">Social Network Benchmark [4]</a> (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework where different graph-based technologies can be fairly tested and compared, that can drive the identification of systems&rsquo; bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data management.</p>
+<p>LDBC SNB provides <a href="https://github.com/ldbc/ldbc_snb_datagen">Datagen</a> (Data Generator), which produces synthetic datasets, mimicking a social network&rsquo;s activity during a period of time. Datagen is defined by the characteristics of realism, scalability, determinism and usability. To address scalability in particular, Datagen has been implemented on the MapReduce computation model to enable scaling out across a distributed cluster. However, since its inception in the early 2010s there has been a tremendous amount of development in the big data landscape, both in the sophistication of distributed processing platforms and in public cloud IaaS offerings. In the light of this, we should reevaluate this implementation and, in particular, investigate whether Apache Spark would be a more cost-effective solution for generating datasets on the scale of tens of terabytes, on public clouds such as Amazon Web Services (AWS).</p>
+<h2 id="overview">Overview</h2>
+<p>The benchmark&rsquo;s specification describes a social network <a href="https://github.com/ldbc/ldbc_snb_docs/blob/9253abbde94ec7eaccd366c5d4c15cca30752e36/figures/schema-comfortable.pdf">data model</a> which divides its components into two broad categories: static and dynamic. The dynamic element consists of an evolving network where people make friends, post in forums, comment or like each other&rsquo;s posts, etc.
In contrast, the static component contains related entities such as countries, universities and organizations, whose values are fixed. For the detailed specifications of the benchmark and the Datagen component, see <a href="#references">References</a>.</p>
+<p>Datasets are generated in a multi-stage process captured as a sequence of MapReduce steps (shown in the diagram below).</p>
+<p><img src="datagen_flow.png" alt=""> \ <em>Figure 1. LDBC SNB Datagen Process on Hadoop</em></p>
+<p>In the initialization phase, dictionaries are populated and distributions are initialized. In the first generation phase, persons are synthesized, then relationships are wired between them along 3 dimensions (university, interest and random). After merging the graph of person relationships, the resulting dataset is output. Following this, activities such as forum posts, comments, likes and photos are generated and output. Finally, the static components are output.</p>
+<p><em>Note: The diagram shows the call sequence as implemented. All steps are sequential &ndash; including the relationship generation &ndash; even in cases where the data dependencies would allow for parallelization.</em></p>
+<p>Entities are generated by procedural Java code and are represented as POJOs in memory and as sequence files on disk. Most entities follow a shallow representation, i.e. foreign keys (in relational terms) are mapped to integer ids, which makes serialization straightforward.<sup id="fnref:1"><a href="#fn:1" class="footnote-ref" role="doc-noteref">1</a></sup> A notable exception is the Knows edge, which contains only the target vertex and is used as a navigation property on the source Person. The target Person is replaced with only the foreign key, augmented with some additional information, in order to keep the structure free of cycles. Needless to say, this <em>edge as property</em> representation makes the data harder to handle in SQL than it would be with a flat join table.</p>
+<p>Entity generation amounts to roughly one fifth of the main codebase. It generates properties drawn from several random distributions using mutable pRNGs. Determinism is achieved by initializing the pRNGs to seeds that are fully defined by the configuration with constants, and otherwise having no external state in the logic.<sup id="fnref:2"><a href="#fn:2" class="footnote-ref" role="doc-noteref">2</a></sup></p>
+<p>Serialization is done by hand-written serializers for the supported output formats (e.g. CSV) and comprises just a bit less than one third of the main codebase. Most of the output is created by directly interacting with low-level HDFS file streams. Ideally, this code should be migrated to higher-level writers that handle faults and give consistent results when the task has to be restarted.</p>
+<h2 id="motivations-for-the-migration">Motivations for the migration</h2>
+<p>The application is written using Hadoop MapReduce, which is now largely superseded by more modern distributed batch processing platforms, notably Apache Spark. For this reason, it was proposed to migrate Datagen to Spark. The migration provides the following benefits:</p>
+<ul>
+<li>
+<p><strong>Better memory utilization:</strong> MapReduce is disk-oriented, i.e. it writes the output to disk after each reduce stage, which is then read by the next MapReduce job. As public clouds provide virtual machines with sufficient RAM to encapsulate any generated dataset, time and money are wasted by the overhead this unnecessary disk I/O incurs.
Instead, the intermediate results should be cached in memory where possible. The lack of support for this is a well-known limitation of MapReduce.</p>
+</li>
+<li>
+<p><strong>Smaller codebase:</strong> The Hadoop MapReduce library is fairly ceremonial and boilerplate-heavy. Spark provides a higher-level abstraction that is simpler to work with, while still providing enough control over the lower-level details required for this workload.</p>
+</li>
+<li>
+<p><strong>Small entry cost:</strong> Spark and MapReduce are very close conceptually: both utilise HDFS under the hood and run on the JVM. This means that a large chunk of the existing code can be reused, and migration to Spark can, therefore, be completed with relatively small effort. Additionally, MapReduce and Spark jobs can be run on AWS EMR using basically the same HW/SW configuration, which facilitates straightforward performance comparisons.</p>
+</li>
+<li>
+<p><strong>Incremental improvements:</strong> Spark exposes multiple APIs for different workloads, operating on different levels of abstraction. Datagen may initially utilise the lower-level, Java-oriented RDDs (which offer the clearest 1-to-1 mapping when coming from MapReduce) and gradually move towards DataFrames to support Parquet output in the serializers and maybe unlock some SQL optimization capabilities in the generators later down the road.</p>
+</li>
+<li>
+<p><strong>OSS, commodity:</strong> Spark is one of the most widely used open-source big data platforms. Every major public cloud provides a managed offering for Spark. Together, these mean that the migration increases the approachability and portability of the code.</p>
+</li>
+</ul>
+<h2 id="first-steps">First steps</h2>
+<p>The first milestone is a successful run of LDBC Datagen on Spark while making the minimum number of necessary code alterations. This entails the migration of the Hadoop wrappers around the generators and serializers. The following bullet points summarize the key notions that cropped up during the process.</p>
+<ul>
+<li>
+<p><strong>Use your memory:</strong> A strong focus was placed on keeping the call sequence intact, so that the migrated code evaluates the same steps in the same order, but with data passed as RDDs. It was hypothesised that the required data could either be cached entirely in memory at all times or, failing that, that regenerating it would still be faster than involving the disk I/O loop (e.g. by using <code>MEMORY_AND_DISK</code>). In short, the default caching strategy was used everywhere.</p>
+</li>
+<li>
+<p><strong>Regression tests:</strong> The lack of tests, apart from an id uniqueness check, meant there was no means to detect bugs introduced by the migration. Designing and implementing a comprehensive test suite was out of scope, so instead, regression testing was utilised, with the MapReduce output as the baseline. The original output mostly consists of Hadoop sequence files which can be read into Spark, allowing comparisons to be drawn with the output from the RDD produced by the migrated code.</p>
+</li>
+<li>
+<p><strong>Thread-safety concerns:</strong> Soon after migrating the first generator and running the regression tests, there were clear discrepancies in the output. These only surfaced when the parallelization level was set to greater than 1. This indicated the presence of potential race conditions.
Thread-safety wasn&rsquo;t a concern in the original implementation due to the fact that MapReduce doesn&rsquo;t use thread-based parallelization for mappers and reducers.<sup id="fnref:3"><a href="#fn:3" class="footnote-ref" role="doc-noteref">3</a></sup> In Spark, however, tasks are executed by parallel threads in the same JVM application, so the code is required to be thread-safe. After some debugging, a bug was discovered originating from the shared use of java.text.SimpleDateFormat (notoriously not thread-safe) in the serializers. This was resolved simply by changing to java.time.format.DateTimeFormatter. There were multiple instances of some static field on an object being mutated concurrently. In some cases this was a temporary buffer and was easily resolved by making it an instance variable. In another case a shared context variable was used, which was resolved by passing dedicated instances as function arguments. Sadly, the Java language has the same syntax for accessing locals, fields and statics,<sup id="fnref:4"><a href="#fn:4" class="footnote-ref" role="doc-noteref">4</a></sup> which makes it somewhat harder to find potential unguarded shared variables.</p>
+</li>
+</ul>
+<h2 id="case-study-person-ranking">Case study: Person ranking</h2>
+<p>Migrating was rather straightforward; however, the so-called person ranking step required some thought. The goal of this step is to organize persons so that similar ones appear close to each other in a deterministic order. This provides a scalable way to cluster persons according to a similarity metric, as introduced in the <a href="#references">S3G2 paper [3]</a>.</p>
+<h3 id="the-original-mapreduce-version">The original MapReduce version</h3>
+<p><img src="person_ranking.svg" alt=""> \ <em>Figure 2. Diagram of the MapReduce code for ranking persons</em></p>
+<p>The implementation, shown in pseudocode above, works as follows:</p>
+<ol>
+<li>The equivalence keys are mapped to each person and fed into TotalOrderPartitioner, which maintains an order-sensitive partitioning while trying to emit more or less equal-sized groups to keep the data skew low.</li>
+<li>The reducer keys the partitions with its own task id and a counter variable which has been initialized to zero and is incremented on each person, establishing a local ranking inside the group. The final state of the counter (which is the total number of persons in that group) is saved to a separate &ldquo;side-channel&rdquo; file upon the completion of a reduce task.</li>
+<li>In a consecutive reduce-only stage, the global order is established by reading all of these previously emitted count files in the order of their partition number in each reducer, then creating an ordered map from each partition number to the corresponding cumulative count of persons found in all preceding ones. This is done in the setup phase. In the reduce function, the respective count is incremented and assigned to each person.</li>
+</ol>
+<p>Once this ranking is done, the whole range is sliced up into equally sized blocks, which are processed independently. For example, when wiring relationships between persons, only those appearing in the same block are considered.</p>
+<h3 id="the-migrated-version">The migrated version</h3>
+<p>Spark provides a <code>sortBy</code> function which takes care of the first step above in a single line. The gist of the problem remains collecting the partition sizes and making them available in a later step.</p>
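+<p>A minimal sketch of one way to do this with Spark&rsquo;s Scala API is shown below; the <code>Person</code> type and the <code>equivalenceKey</code> function are hypothetical stand-ins rather than the actual Datagen code, so this only illustrates the technique:</p>
+<pre><code>import org.apache.spark.rdd.RDD
+
+object PersonRanking {
+  // Hypothetical stand-ins for the actual Datagen types (illustration only).
+  case class Person(id: Long, key: String)
+  def equivalenceKey(p: Person): String = p.key
+
+  def rankPersons(persons: RDD[Person]): RDD[(Long, Person)] = {
+    // 1. Sort by the equivalence key; sortBy range-partitions the data,
+    //    playing the role of TotalOrderPartitioner in the MapReduce version.
+    val sorted = persons.sortBy(equivalenceKey)
+
+    // 2. Collect the size of each partition in a separate job
+    //    (the counterpart of the MapReduce side-channel count files).
+    val sizes: Array[Long] = sorted
+      .mapPartitionsWithIndex((i, it) =&gt; Iterator((i, it.size.toLong)))
+      .collect().sortBy(_._1).map(_._2)
+
+    // 3. Broadcast the cumulative counts so that every task knows how many
+    //    persons precede its partition.
+    val offsets = sorted.sparkContext.broadcast(sizes.scanLeft(0L)(_ + _))
+
+    // 4. Global rank = partition offset + local position within the partition.
+    sorted.mapPartitionsWithIndex { (i, it) =&gt;
+      it.zipWithIndex.map { case (p, j) =&gt; (offsets.value(i) + j, p) }
+    }
+  }
+}
+</code></pre>
+<p>Incidentally, Spark&rsquo;s built-in <code>RDD.zipWithIndex</code> uses the same two-step trick (one job to count the partition sizes, then index assignment), so a hand-rolled version mainly serves to mirror the structure of the original MapReduce code.</p>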
+<p>While the MapReduce version uses a side output, in Spark the partition sizes are collected in a separate job and passed into the next phase using a broadcast variable. The resulting code size is a fraction of the original one.</p>
+<h2 id="benchmarks">Benchmarks</h2>
+<p>Benchmarks were carried out on AWS <a href="https://aws.amazon.com/emr/">EMR</a>, originally utilising <a href="https://aws.amazon.com/ec2/instance-types/i3/">i3.xlarge</a> instances because of their fast NVMe SSD storage and ample amount of RAM.</p>
+<p>The application parameter <code>hadoop.numThreads</code> controls the number of reduce threads in each Hadoop job for the MapReduce version and the number of partitions in the serialization jobs in the Spark one. For MapReduce, this was set to <code>n_nodes</code>, i.e. the number of machines; experimentation yielded slowdowns for higher values. The Spark version, on the other hand, performed better with this parameter set to <code>n_nodes * v_cpu</code>. The scale factor (SF) parameter determines the output size. It is defined so that one SF unit generates around 1 GB of data. That is, SF10 generates around 10 GB, SF30 around 30 GB, etc. It should be noted, however, that the output was incidentally only 60% of this in these experiments, for two reasons. First, update stream serialization was not migrated to Spark, due to problems in the original implementation. Of course, for the purpose of a faithful comparison the corresponding code was removed from the MapReduce version as well before executing the benchmarks. This explains a 10% reduction from the expected size. The rest can be attributed to incorrectly tuned parameters.<sup id="fnref:5"><a href="#fn:5" class="footnote-ref" role="doc-noteref">5</a></sup> The MapReduce results were as follows:</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * workers / SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10</td>
+<td>1</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>16</td>
+<td>1.60</td>
+</tr>
+<tr>
+<td>30</td>
+<td>1</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>34</td>
+<td>1.13</td>
+</tr>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>40</td>
+<td>1.20</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>MapReduce</td>
+<td>i3.xlarge</td>
+<td>44</td>
+<td>1.32</td>
+</tr>
+</tbody>
+</table>
+<p>It can be observed that the runtime per scale factor only increases slowly, which is good. The metric charts show an underutilized, bursty CPU. The bursts are supposedly interrupted by the disk I/O parts when the node is writing the results of a completed job. It can also be seen that the memory only starts to get consumed after 10 minutes of the run have passed.</p>
+<p><img src="mr_sf100_cpu_load.png" alt=""> <br>
+<em>Figure 3. CPU load for the MapReduce cluster is bursty and less than<br>
+50% on average (SF100, 2nd graph shows master)</em></p>
+<p><img src="mr_sf100_mem_free.png" alt=""> <br>
+<em>Figure 4.
The job only starts to consume memory 10 minutes<br>
+into the run (SF100, 2nd graph shows master)</em></p>
+<p>Let&rsquo;s see how Spark fares.</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * workers / SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>10</td>
+<td>1</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>10</td>
+<td>1.00</td>
+</tr>
+<tr>
+<td>30</td>
+<td>1</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>21</td>
+<td>0.70</td>
+</tr>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>27</td>
+<td>0.81</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>36</td>
+<td>1.08</td>
+</tr>
+<tr>
+<td>1000</td>
+<td>30</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>47</td>
+<td>1.41</td>
+</tr>
+<tr>
+<td>3000</td>
+<td>90</td>
+<td>Spark</td>
+<td>i3.xlarge</td>
+<td>47</td>
+<td>1.41</td>
+</tr>
+</tbody>
+</table>
+<p>A similar trend can be seen here; however, the run times are around 70% of the MapReduce version. It can be seen that the larger scale factors (SF1000 and SF3000) yielded a longer runtime than expected. On the metric charts of SF100 the CPU shows full utilization, except at the end, when the results are serialized in one go and the CPU is basically idle (the snapshot of the diagram doesn&rsquo;t include this part unfortunately). Spark can be seen to have used up all memory pretty fast even in the case of SF100. In the case of SF1000 and SF3000, the nodes are running so low on memory that most probably some of the RDDs have to be calculated multiple times (no disk-level serialization was used here), which seems to be the most plausible explanation for the slowdowns experienced. In fact, the OOM errors encountered when running SF3000 support this hypothesis even further. It was thus proposed to scale up the RAM in the instances. The CPU utilization hints that adding some extra vCPUs could yield a further speedup as well.</p>
+<p><img src="spark_sf100_cpu_load.png" alt=""> <br>
+<em>Figure 5. Full CPU utilization for Spark (SF100, last graph shows<br>
+master)</em></p>
+<p><img src="spark_sf100_mem_free.png" alt=""> <br>
+<em>Figure 6. Spark eats up memory fast (SF100, 2nd graph shows master)</em></p>
+<p>i3.2xlarge would have been the most straightforward option for scaling up the instances; however, the humongous 1.9 TB disk of this instance type is completely unnecessary for the job.
Instead, the cheaper r5d.2xlarge instance was utilised, which is largely identical to i3.2xlarge, except that it <em>only</em> has a 300 GB SSD.</p>
+<table>
+<thead>
+<tr>
+<th>SF</th>
+<th>workers</th>
+<th>Platform</th>
+<th>Instance Type</th>
+<th>runtime (min)</th>
+<th>runtime * workers / SF (min)</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>100</td>
+<td>3</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>16</td>
+<td>0.48</td>
+</tr>
+<tr>
+<td>300</td>
+<td>9</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>21</td>
+<td>0.63</td>
+</tr>
+<tr>
+<td>1000</td>
+<td>30</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>26</td>
+<td>0.78</td>
+</tr>
+<tr>
+<td>3000</td>
+<td>90</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>25</td>
+<td>0.75</td>
+</tr>
+<tr>
+<td>10000</td>
+<td>303</td>
+<td>Spark</td>
+<td>r5d.2xlarge</td>
+<td>25</td>
+<td>0.75</td>
+</tr>
+</tbody>
+</table>
+<p>The last column clearly demonstrates our ability to keep the cost per scale factor unit constant.</p>
+<h2 id="next-steps">Next steps</h2>
+<p>The next improvement is refactoring the serializers so they use Spark&rsquo;s high-level writer facilities. The most compelling benefit is that it will make the jobs fault-tolerant, as Spark maintains the integrity of the output files in case the task that writes them fails. This makes Datagen more resilient and opens up the possibility of running on less reliable hardware configurations (e.g. EC2 spot nodes on AWS) for additional cost savings. The new writers will supposedly also yield some speedup on the same cluster configuration.</p>
+<p>As already mentioned, the migration of the update stream serialization was skipped due to problems with the original code. Ideally, the update streams should be implemented with the new serializers.</p>
+<p>The Spark migration also serves as an important building block for the next generation of LDBC benchmarks. As part of extending the SNB benchmark suite, the SNB task force has recently extended Datagen with support for <a href="#references">generating delete operations [1]</a>. The next step for the task force is to fine-tune the temporal distributions of these deletion operations to ensure that the emerging sequence of events is realistic, i.e. the emerging distribution resembles what a database system would experience when serving a real social network.</p>
+<h2 id="acknowledgements">Acknowledgements</h2>
+<p>This work is based upon the work of Arnau Prat, Gábor Szárnyas, Ben Steer, Jack Waudby and other LDBC contributors.
Thanks for your help and feedback!</p> +<h2 id="references">References</h2> +<p>[1] <a href="https://ldbcouncil.org/docs/papers/datagen-deletes-grades-nda-2020.pdf">Supporting Dynamic Graphs and Temporal Entity Deletions in the LDBC Social Network Benchmark&rsquo;s Data Generator</a></p> +<p>[2] <a href="https://www.youtube.com/watch?v=ZQOLuCOOpSI">9th TUC Meeting &ndash; LDBC SNB Datagen Update &ndash; Arnau Prat (UPC)</a> - <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">slides</a></p> +<p>[3] <a href="https://research.vu.nl/en/publications/s3g2-a-scalable-structure-correlated-social-graph-generator">S3G2: a Scalable Structure-correlated Social Graph Generator</a></p> +<p>[4] <a href="https://arxiv.org/abs/2001.02299">The LDBC Social Network Benchmark</a></p> +<p>[5] <a href="https://ldbcouncil.org/">LDBC</a> - <a href="https://github.com/ldbc">LDBC GitHub organization</a></p> +<div class="footnotes" role="doc-endnotes"> +<hr> +<ol> +<li id="fn:1"> +<p>Also makes it easier to map to a tabular format thus it is a SQL friendly representation.&#160;<a href="#fnref:1" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:2"> +<p>It&rsquo;s hard to imagine this done declaratively in SQL.&#160;<a href="#fnref:2" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:3"> +<p>Instead, multiple YARN containers have to be used if you want to parallelize on the same machine.&#160;<a href="#fnref:3" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:4"> +<p>Although editors usually render these using different font styles.&#160;<a href="#fnref:4" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +<li id="fn:5"> +<p>With the addition of deletes, entities often get inserted and deleted during the simulation (which is normal in a social network). During serialization, we check for such entities and omit them. However, we forgot to calculate this when determining the output size, which we will amend when tuning the distributions.&#160;<a href="#fnref:5" class="footnote-backref" role="doc-backlink">&#x21a9;&#xfe0e;</a></p> +</li> +</ol> +</div> + + + + + Twelfth TUC Meeting + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + Fri, 05 Jul 2019 08:30:00 +0100 + + https://ldbcouncil.org/event/twelfth-tuc-meeting/ + <p>LDBC is pleased to announce its Twelfth Technical User Community (TUC) meeting.</p> +<p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmarks and graph standards, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j, TigerGraph and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event on the last Friday of <strong><a href="https://sigmod2019.org/">SIGMOD/PODS 2019</a></strong> in Amsterdam, The Netherlands, in the conference venue of <strong><a href="http://sigmod2019.org/conf_venue">Beurs van Berlage</a></strong>. The room is the Mendes da Silva kamer. 
Please check its tips for <strong><a href="http://sigmod2019.org/accommodation">accommodation in Amsterdam</a></strong>.</p> +<p>Note also that at SIGMOD/PODS in Amsterdam on Sunday, June 30, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2019">GRADES-NDA 2019</a>, that may be of interest to our audience (this generally holds for the whole SIGMOD/PODS program, of course).</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>You need to be registered in order to get into the SIGMOD/PODS venue. Friday, July 5, is the final, workshop, day of SIGMOD/PODS, and the LDBC TUC meeting joins the other workshops for coffee and lunch.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management.</p> +<p><strong>Talk proposals can be sent to Peter Boncz</strong>, who is also the local organizer. <strong>Please also send your slides to this email for archiving on this site.</strong></p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting, there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The morning slot (08:30-10:30) is reserved for an LDBC Board Meeting, to which in principle only LDBC directors are invited (that meeting will be held in the same room).</p> +<p>The TUC meeting will start on Friday morning after the morning coffee break of SIGMOD/PODS 2019 (<strong>room: Mendes da Silva kamer</strong>):</p> +<p>08:30-10:30 LDBC Board Meeting (non-public)</p> +<p>10:30-11:00 Coffee</p> +<p>11:00-12:45 Session 1: Graph Benchmarks</p> +<ul> +<li> +<p>11:00-11:05 Welcome &amp; introduction</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230404.pdf">11:05-11:45 Gabor Szarnyas (BME), Benjamin Steer (QMUL), Jack Waudby (Newcastle University): Business Intelligence workload: Progress report and roadmap</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706117.pdf">11:45-12:00 Frank McSherry (Materialize): Experiences implementing LDBC queries in a dataflow system</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706118.pdf">12:00-12:25 Vasileios Trigonakis (Oracle): Evaluating a new distributed graph query engine with LDBC: Experiences and limitations</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706130.pdf">12:25-12:45 Ahmed Musaafir (VU Amsterdam): LDBC Graphalytics</a></p> +</li> +</ul> +<p>12:45-14:00 Lunch</p> +<p>14:00-16:05 Session 2: Graph Query Languages</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706120.pdf">14:00-14:25 Juan Sequeda (Capsenta): Property Graph Schema Working Group: A progress report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706121.pdf">14:25-14:50 Stefan Plantikow (Neo4j): GQL: Scope and features</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706122.pdf">report</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706119.pdf">14:50-15:15 Vasileios Trigonakis (Oracle): Property graph extensions for the SQL standard</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706129.pdf">15:15-15:40 Alin Deutsch (TigerGraph): Modern graph analytics support in GSQL, TigerGraph&rsquo;s query language</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/112230401.pdf">15:40-16:05 Jan Posiadała (Nodes and Edges, Poland): Executable semantics of graph query language</a></p> +</li> +</ul> +<p>16:05-16:30 Coffee</p> 
+<p>16:30-17:50 Session 3: Graph System Performance</p> +<ul> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111968258.pdf">16:30-16:50 Per Fuchs (CWI): Fast, scalable WCOJ graph-pattern matching on in-memory graphs in Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706124.pdf">16:50-17:10 Semih Salihoglu (University of Waterloo): Optimizing subgraph queries with a mix of tradition and modernity</a> <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706116.pptx">pptx</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706128.pdf">17:10-17:30 Roi Lipman (RedisGraph): Evaluating Cypher queries and procedures as algebraic operations within RedisGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/twelfth-tuc-meeting/attachments/106233859/111706133.pdf">17:30-17:50 Alexandru Uta (VU Amsterdam): Low-latency Spark queries on updatable data</a></p> +</li> +</ul> +<p>If there is interest, we will organize a social dinner on Friday evening for LDBC attendees.</p> + + + + + Eleventh TUC Meeting + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + Fri, 08 Jun 2018 08:30:00 -0500 + + https://ldbcouncil.org/event/eleventh-tuc-meeting/ + <p>LDBC Technical User Community meetings serve to (1) learn about progress in the LDBC task forces on graph benchmark development, (2) to give feedback on these, and (3) hear about user experiences with graph data management technologies or (4) learn about new graph technologies from researchers or industry &ndash; LDBC counts Oracle, IBM, Intel, Neo4j and Huawei among its members.</p> +<p>This TUC meeting will be a one-day event preceding the <a href="https://sigmod2018.org/">SIGMOD/PODS 2018</a> conference in Houston, Texas (not too far away, the whole next week). Note also that at SIGMOD/PODS in Houston on Sunday 10, there is a research workshop on graph data management technology called <a href="https://sites.google.com/site/gradesnda2018/">GRADES-NDA 2018</a> as well, so you might combine travel.</p> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a> to register.</p> +<p><strong>=&gt; registration is free, but required &lt;=</strong></p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals are handled by Peter Boncz (<a href="mailto:boncz@cwi.nl">boncz@cwi.nl</a>) and Larri (<a href="mailto:larri@ac.upc.ed">larri@ac.upc.edu</a>). 
Local organizer is Juan Sequeda (<a href="mailto:juanfederico@gmail.com">juanfederico@gmail.com</a>).</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its interactive, business analytics and graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges and products</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00:</p> +<ul> +<li> +<p>10:30-10:35 Peter Boncz (CWI) - introduction to the LDBC TUC meeting</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090478.pdf">10:35-11:00 Juan Sequeda (Capsenta) - Announcing: gra.fo</a></p> +</li> +<li> +<p>11:00-11:30 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090466.pdf">11:30-11:55 Gabor Szarnyas (BME) - LDBC benchmarks: three aspects of graph processing</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090463.pdf">11:55-12:20 Peter Boncz (CWI) - G-CORE: a composable graph query language by LDBC</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090472.pdf">12:20-12:45 Yinglong Xia (Huawei) - Graph Engine for Cloud AI</a></p> +</li> +<li> +<p>12:45-14:00 lunch</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090474.pdf">14:00-14:25 Stefan Plantikow (Neo4j) - Composable Graph Queries and Multiple Named Graphs in Cypher for Apache Spark</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090481.pdf">14:25-14:50 Oskar van Rest (Oracle) - Analyzing Stack Exchange data using Property Graph in Oracle</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99090485.pdf">14:50-15:15 Brad Bebee (Amazon) - Neptune: the AWS graph management service</a></p> +</li> +<li> +<p>15:15-15:40 coffee break</p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99811329.pdf">15:40-16:05 Bryon Jacob (data.world): Broadening the Semantic Web</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99287041.pdf">16:05-16:30 Jason Plurad (IBM) - Graph Computing with JanusGraph</a></p> +</li> +<li> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99745793.pdf">16:30-16:55 Arthur Keen (Cambridge Semantics): AnzoGraph</a></p> +</li> +<li> +<p><a href="http://relational.ai/">16:55-17:20 Molham Aref (relational.ai)</a>) - Introducing.. 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eleventh-tuc-meeting/attachments/91422722/99418113.pdf">relational.ai</a></p> +</li> +<li> +<p>18:00 - 20:00 social dinner in Austin (sponsored by Intel Corp.), Coopers BBQ, 217 Congress Ave, Austin, TX 78701</p> +</li> +</ul> +<h3 id="location">Location</h3> +<p>The TUC will be held at the <a href="https://www.cs.utexas.edu/">University of Texas at Austin, Department of Computer Science</a> in the <a href="https://www.google.com/maps/place/The+University+of+Texas:+Department+of+Computer+Science/@30.2860955,-97.737582,18z/data=!4m5!3m4!1s0x0:0x12edecc8226b3241!8m2!3d30.2862279!4d-97.7365348">Gates Dell Complex (GDC): 2317 Speedway, Austin TX, 78712</a> Room: GDC 6.302</p> +<p>The GDC building has a North and a South building. GDC 6.302 is in the North building. When you enter the main entrance, the North building is on the left and it is served by a pair of elevators. You can take or the elevator to the 6th floor. Exit the elevator on the 6th floor. Turn left, right, left.</p> +<h3 id="from-austin-to-sigmodpods-houston-on-saturday-june-9">From Austin to SIGMOD/PODS (Houston) on Saturday June 9</h3> +<p>Many of the attendees will be going to SIGMOD/PODS which will be held in Houston.</p> +<h4 id="bus">Bus</h4> +<p>One option is to take a <a href="https://us.megabus.com/journey-planner/journeys?days=1&amp;concessionCount=0&amp;departureDate=2018-06-09&amp;destinationId=318&amp;inboundOtherDisabilityCount=0&amp;inboundPcaCount=0&amp;inboundWheelchairSeated=0&amp;nusCount=0&amp;originId=320&amp;otherDisabilityCount=0&amp;pcaCount=0&amp;totalPassengers=1&amp;wheelchairSeated=0">MegaBus that departs from downtown Austin and arrives at downtown Houston</a>.</p> +<p>There is a bus that departs at 12:00PM and arrives at 3:00pm. Cost is $20 (as of April 23).</p> +<p>If you want to spend the day in Austin, there is a bus that departs at 9:55PM and arrives at 12:50am. Cost is $5 (as of April 23).</p> + + + + + Tenth TUC Meeting + https://ldbcouncil.org/event/tenth-tuc-meeting/ + Fri, 01 Sep 2017 10:30:00 +0100 + + https://ldbcouncil.org/event/tenth-tuc-meeting/ + <p>This will be a one-day event at the <a href="http://www.vldb.org/2017">VLDB 2017</a> conference in Munich, Germany on September 1, 2017.</p> +<p>Topics and activities of interest in these TUC meetings are:</p> +<ul> +<li>Presentation on graph data management usage scenarios.</li> +<li>Presentation of the benchmarking results for the different benchmarks, as well as the graph query language task force.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested to attend the event, please, contact Adrian Diaz (UPC) at <a href="mailto:adiaz@ac.upc.edu">adiaz@ac.upc.edu</a> to register; registration is free, but required.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. 
Talk proposals are handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Friday morning, with a program from 10:30-17:00</p> +<p>10:30-12:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87588865.pdf">Peter Boncz (CWI): GraphQL task force update - the G-CORE proposal</a> (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868018.pptx">pptx</a>)</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868008.pdf">Gabor Szarnyas (Budapest University of Technology and Economics Hungarian Academy of Sciences): Updates on the Social Network Benchmark BI Workload</a></li> +<li>Alexandru Iosup, Wing Lung Ngai (VU/TU Delft): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868014.pdf">LDBC Graphalytics v0.9</a>, <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868013.pdf">Graphalytics Global Competition and Graphalytics Custom Benchmark</a></li> +</ul> +<p>12:00-13:30: lunch break</p> +<p>13:30-15:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868024.pdf">Arnau Prat (UPC): Datasynth: Democratizing property graph generation</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/86868026.pdf">Marcus Paradies (SAP): SAP HANA GraphScript</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031809.pdf">Yinglong Xia (Huawei): The EYWA Graph Engine in a Cloud AI Platform</a></li> +<li>Gaétan Hains (Huawei): Cost semantics for graph queries</li> +</ul> +<p>15:00-15:30: break</p> +<p>15:30-17:00: TUC session (public)</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87031812.pdf">Petra Selmer and Stefan Plantikow (Neo4j): openCypher Developments in 2017</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/87195650.pdf">Markus Kaindl (Springer): SN SciGraph &ndash; Building a Linked Data Knowledge Graph for the Scholarly Publishing Domain</a></li> +<li>Irini Fundulaki (FORTH): The HOBBIT Link Discovery and Versioning Benchmarks</li> +<li>Ghislain Atemezing (Mondeca): Benchmarking Enterprise RDF stores with Publications Office Dataset</li> +</ul> +<p>Speakers should aim for a <strong>20-minute talk</strong>.</p> +<p>Further:</p> +<ul> +<li>on Friday 
evening (19:00-21:00) there will be a <strong>social dinner</strong> at <a href="https://www.loewenbraeukeller.com/en/pub-and-beer-garden/">Löwenbräukeller</a>, sponsored and arranged by LDBC member Huawei (who have their European Research Center in Munich).</li> +<li>on Friday morning (8:30-10:30) there will be a meeting of the LDBC board of directors, but this meeting is not public.</li> +</ul> +<h3 id="venue">Venue</h3> +<p>The Technical University of Munich (TUM) is hosting that week the <a href="http://www.vldb.org/2017">VLDB conference</a>; on the day of the TUC meeting the main conference will have finished, but there will be a number of co-located workshops ongoing, and the TUC participants will blend in with that crowd for the breaks and lunch.</p> +<p>The TUC meeting will be held in in <strong>Room 2607</strong> alongside the VLDB workshops that day (MATES, ADMS, DMAH, DBPL and BOSS).</p> +<p><strong>address: Technische Universität München (TUM), Arcisstraße 21, 80333 München</strong></p> +<p><a href="https://www.google.nl/maps/place/Technische+Universit%C3%A4t+M%C3%BCnchen/@48.14966,11.5656715,17z/data=!3m1!4b1!4m5!3m4!1s0x479e7261336d8c11:0x79a04d44dc5bf19d!8m2!3d48.14966!4d11.5678602?hl=en">Google Maps</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920002.jpg" alt=""><br> +<img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/tenth-tuc-meeting/attachments/81920005/81920003.jpg" alt=""></p> + + + + + Ninth TUC Meeting + https://ldbcouncil.org/event/ninth-tuc-meeting/ + Thu, 09 Feb 2017 15:07:18 -0400 + + https://ldbcouncil.org/event/ninth-tuc-meeting/ + <p>LDBC is pleased to announce its Ninth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> in Walldorf, Germany on February 9+10, 2017.</p> +<p>This will be the third TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>;</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is related to graph data management. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of TUC meeting participants and graph technology user contacts, and eventually its membership base.</p> +<h3 id="agenda">Agenda</h3> +<p>In the TUC meeting there will be:</p> +<ul> +<li>updates on progress with LDBC benchmarks, specifically the Social Network Benchmark (SNB) and its Interactive, Business Intelligence and Graphalytics workloads.</li> +<li>talks by data management practitioners highlighting graph data management challenges</li> +<li>selected scientific talks on graph data management technology</li> +</ul> +<p>The meeting will start on Thursday morning, with a program from 09:00-18:00, interrupted by a lunch break.</p> +<p>Thursday evening (19:00-21:00) there will be a <strong>social dinner</strong> in Heidelberg.</p> +<p>Friday morning the event resumes from 9:00-12:00. In the afternoon, there is a (closed) LDBC Board of Directors meeting (13:00-16:30) at the same venue.</p> +<h4 id="social-dinner">Social Dinner</h4> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235334.png" alt=""></p> +<p><strong>Address: Hauptstraße 217, 69117 Heidelberg</strong><br> +<strong>Time: 19:00 / 7pm</strong></p> +<p>(See attachments at the bottom of the page)</p> +<h5 id="thursday">Thursday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>Welcome and logistics - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>9:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235329.pdf">Intro + state of the LDBC - Josep Lluis Larriba Pey</a> (UPC)</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235338.pdf">LDBC Graph QL task force</a> - Hannes Voigt (TU Dresden)</td> +</tr> +<tr> +<td>9:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235335.pdf">PGQL Status Update and Comparison to LDBC&rsquo;s Graph QL proposals</a> - Oskar van Rest (Oracle Labs)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628546.pdf">Adding shortest-paths to MonetDB</a> - Dean de Leo (CWI)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431939.pdf">Evolving Cypher for processing multiple graphs</a> - Stefan Plantikow (Neo Technology)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235346.pdf">Standardizing Graph Database Functionality - An Invitation to Collaborate</a> - Jan Michels (ISO/ANSI SQL, Oracle)</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75235343.pdf">Dgraph: Graph database for production environment</a> - Tomasz Zdybal (Dgraph.io)</td> +</tr> +<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431945.pdf">LDBC Graphalytics: Current Capabilities, Upcoming Features, and Long-Term Roadmap</a> - Alexandru Iosup (TU Delft)</td> +</tr>
+<tr> +<td>13:20</td> +<td>LDBC Graphalytics: Demo of the Live Archive and Competition Features - Tim Hegeman (TU Delft)</td> +</tr> +<tr> +<td>13:40</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431942.pdf">LDBC SNB Datagen Update</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431943.pdf">LDBC SNB Business Intelligence Workload: Chokepoint Analysis</a> - Arnau Prat (UPC)</td> +</tr> +<tr> +<td>14:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431947.pdf">LDBC Benchmark Cost Specification</a> (+discussion) - Moritz Kaufmann (TU Munich)</td> +</tr> +<tr> +<td>14:40</td> +<td>coffee break</td> +</tr> +<tr> +<td>15:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76316673.pdf">EYWA: the Distributed Graph Engine in Huawei MIND Platform</a> (Yinglong Xia)</td> +</tr> +<tr> +<td>15:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75431949.pdf">Graph Processing in SAP HANA</a> - Marcus Paradies (SAP)</td> +</tr> +<tr> +<td>15:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75628563.pdf">Distributed Graph Analytics with Gradoop</a> - Martin Junghanns (Univ Leipzig)</td> +</tr> +<tr> +<td>16:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152834.pdf">Distributed graph flows: Cypher on Flink and Gradoop</a> - Max Kießling (Neo Technology)</td> +</tr> +<tr> +<td>16:30</td> +<td>closing - Peter Boncz</td> +</tr> +<tr> +<td>17:30</td> +<td>end</td> +</tr> +</tbody> +</table> +<h5 id="friday">Friday</h5> +<table> +<thead> +<tr> +<th>start time</th> +<th>title – speaker</th> +</tr> +</thead> +<tbody> +<tr> +<td>9:00</td> +<td>welcome - Peter Boncz</td> +</tr> +<tr> +<td>9:20</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152833.pdf">Graph processing in obi4wan</a> - Frank Smit (OBI4WAN)</td> +</tr> +<tr> +<td>9:40</td> +<td>Graph problems in the space domain - Albrecht Schmidt (ESA)</td> +</tr> +<tr> +<td>10:00</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/75792387.pdf">Medical Ontologies for Healthcare</a> - Michael Neumann (SAP)</td> +</tr> +<tr> +<td>10:20</td> +<td>coffee</td> +</tr> +<tr> +<td>10:50</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76447745.pdf">The Train Benchmark: Cross-Technology Performance Evaluation of Continuous Model Queries</a> - Gabor Szarnyas (BME)</td> +</tr> +<tr> +<td>11:10</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76021761.pdf">Efficient sparse matrix computations and their generalization to graph computing applications</a> - Albert-Jan Yzelman (Huawei)</td> +</tr> +<tr> +<td>11:30</td> +<td><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/76152837.pdf">Experiments on Semantic Publishing Benchmark with large scale real news and LOD data at FactForge</a> - Atanas Kyriakov (Ontotext)</td> +</tr> 
+<tr> +<td>12:00</td> +<td>lunch</td> +</tr> +<tr> +<td>13:00</td> +<td>LDBC Board of Directors Meeting</td> +</tr> +<tr> +<td>17:00</td> +<td>end</td> +</tr> +</tbody> +</table> +<h3 id="logistics">Logistics</h3> +<h5 id="important-things-to-know"><strong>Important things to know</strong></h5> +<p>The following PDF guide provides additional information, such as recommended restaurants as well as sightseeing spots: <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">link</a></p> +<h5 id="venue"><strong>Venue</strong></h5> +<p>The TUC meeting will be held in the <a href="https://websmp201.sap-ag.de/~sapidp/011000358700001204882013E.pdf">SAP Headquarters</a> at the SAP Guesthouse Kalipeh (<a href="https://www.kalipeh.com">https://www.kalipeh.com</a>). The address is:</p> +<p><strong>WDF 44 / SAP Guesthouse Kalipeh<br> +Dietmar-Hopp-Allee 15<br> +69190 Walldorf<br> +Germany</strong></p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p><a href="https://www.google.com/maps/place/SAP+Guesthouse+Kalipeh/@49.2951903,8.6436224,17z/data=!3m1!4b1!4m5!3m4!1s0x4797bea343a566af:0xd70698f3503ab74b!8m2!3d49.2951868!4d8.6458111">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/ninth-tuc-meeting/attachments/59277315/69042180.png" alt=""></p> +<h4 id="getting-there"><strong>Getting there</strong></h4> +<h5 id="by-plane"><strong>By plane</strong></h5> +<p>There are two airports close to SAP&rsquo;s headquarter: Frankfurt Airport (FRA) and Stuttgart-Echterdingen Airport (STR). The journey from Frankfurt Airport to SAP headquarters takes about one hour by car, while it takes slightly longer from Stuttgart- Echterdingen Airport. Concerning airfare, flights to Frankfurt are usually somewhat more expensive than to Stuttgart.</p> +<p>When booking flights to Frankfurt, you should be aware of Frankfurt-Hahn Airport (HHN), which serves low-cost carriers but is not connected to Frankfurt Airport. Frankfurt Hahn is approximately one hour from the Frankfurt main airport by car.</p> +<p>The journey from Frankfurt Airport to SAP headquarters takes about one hour by car (95 kilometers, or 59 miles).</p> +<p>Journey time from Stuttgart-Echterdingen Airport to SAP headquarters takes about 1 hour and 15 minutes by car (115 kilometers, or 71 miles).</p> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<p><strong>Traveling from Frankfurt Airport (FRA) to SAP Headquarters:</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A3/Würzburg/A5/Kassel/Basel/Frankfurt.&rdquo;</li> +<li>Follow the A5 to &ldquo;Basel/Karlsruhe/Heidelberg.&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<p>(Should you use a navigational system which does not recognize the street name &lsquo;Dietmar-Hopp-Allee&rsquo; please use &lsquo;Neurottstrasse&rsquo; instead.)</p> +<p><strong>Traveling from Stuttgart-Echterdingen Airport (STR) to SAP Headquarters:</strong></p> +<p>To get to SAP headquarters by car, there are two possible routes to take. The first leads you via Heilbronn and the second via Karlsruhe. 
The route via Karlsruhe is a bit shorter yet may be more congested.</p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>When leaving the airport, follow the highway symbol onto &ldquo;A8/Stuttgart/B27.&rdquo;</li> +<li>Stay on A8 and follow the sign for &ldquo;Karlsruhe/Heilbronn/Singen/A8.&rdquo;</li> +<li>Follow A8 to Karlsruhe.</li> +<li>Take exit 41 &ndash; &ldquo;Dreieck Karlsruhe&rdquo; to merge onto A5 toward &ldquo;Frankfurt/Mannheim/Karlsruhe/Landau (Pfalz).&rdquo;</li> +<li>Take exit 39 &ndash; &ldquo;Walldorf/Wiesloch.&rdquo;</li> +<li>Turn left onto B291.</li> +<li>Turn right onto Dietmar-Hopp-Allee.</li> +</ul> +<h6 id="parking"><strong>Parking</strong></h6> +<p>The closest parking lot to the event location is P7 (see figure above).</p> +<h5 id="by-train"><strong>By Train</strong></h5> +<p>As the infrastructure is very well developed in Europe, and in Germany in particular, taking the train is a great and easy way of traveling. Furthermore, the trains usually run on time, so this mode of travel is very convenient, especially for a group of people on longer journeys to major cities.</p> +<p><strong>From Frankfurt Airport (FRA) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to Terminal 1, level T (see overview in Appendix).</li> +<li>Go to the AIRail Terminal &ndash; &ldquo;Fernbahnhof&rdquo; (long-distance trains).</li> +<li>Choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP.&rdquo; It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> +<p><strong>From Stuttgart-Echterdingen Airport (STR) to SAP Headquarters</strong></p> +<p>Directions to SAP headquarters:</p> +<ul> +<li>Go to the S-Bahn station in the airport, following the sign (station is called &ldquo;Stuttgart Flughafen/Messe&rdquo;).</li> +<li>Take train number S2 or S3 to &ldquo;Stuttgart Hauptbahnhof&rdquo; (main station).</li> +<li>From Stuttgart Hauptbahnhof choose a connection with the destination train station &ldquo;Wiesloch&ndash;Walldorf&rdquo;.</li> +<li>From station &ldquo;Wiesloch&ndash;Walldorf,&rdquo; take bus number 707 or 721 toward &ldquo;Industriegebiet Walldorf, SAP&rdquo;. It is a 10-minute ride to reach bus stop &lsquo;SAP headquarters&rsquo;.</li> +</ul> + + + + + LDBC Is Proud to Announce the New LDBC Graphalytics Benchmark Draft Specification + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + Tue, 06 Sep 2016 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-is-proud-to-announce-the-new-ldbc-graphalytics-benchmark-draft-specification/ + <p>LDBC is proud to announce the new LDBC Graphalytics Benchmark draft specification.</p> +<p>LDBC Graphalytics is the first industry-grade graph data management benchmark for graph analysis platforms such as Giraph. It consists of six core algorithms, standard datasets, synthetic dataset generators, and reference outputs, enabling the objective comparison of graph analysis platforms. 
It has strong industry support from Oracle, Intel, Huawei and IBM, and was tested and optimized on the best industrial and open-source systems.</p> +<p>Tim Hegeman of <a href="https://www.tudelft.nl">TU Delft</a> is today presenting the technical paper describing LDBC Graphalytics at the important <a href="https://www.vldb.org/conference.html">VLDB</a> (Very Large DataBases) conference in New Delhi, where his talk also marks the release by LDBC of Graphalytics as a benchmark draft. Practitioners are invited to read the PVLDB paper, download the software and try running it.</p> +<p>LDBC is eager to use any feedback for its future adoption of LDBC Graphalytics.</p> +<p>Learn more: <a href="/ldbc-graphalytics">LDBC Graphalytics</a></p> +<p>GitHub: <a href="https://github.com/tudelft-atlarge/graphalytics">https://github.com/tudelft-atlarge/graphalytics</a></p> + + + + + Eighth TUC Meeting + https://ldbcouncil.org/event/eighth-tuc-meeting/ + Wed, 22 Jun 2016 14:45:20 -0400 + + https://ldbcouncil.org/event/eighth-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Eighth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a> in Redwood Shores on <strong>Wednesday and Thursday June 22-23, 2016</strong>.</p> +<p>This will be the second TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will cover the following aspects:</p> +<ul> +<li>Two-day event with one day devoted to users&rsquo; experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify Oracle security in advance, registration requests need to be in by <strong>June 12</strong>.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and in hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you, if you or your colleagues have contacts with companies that deal with graph data management scenarios, to also attend and possibly present.
LDBC is always looking to expand its circle of TUC meeting participants and graph technology user contacts, and eventually its membership base.</p> +<p>On this page, you&rsquo;ll find information about the following items:</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#venue">Venue</a></li> +<li><a href="#getting-there">Getting there</a></li> +</ul> +</li> +<li><a href="#accommodation">Accommodation</a></li> +</ul> +<h3 id="agenda">Agenda</h3> +<p>On Wednesday, lunch is provided for all attendees at 12 pm. The TUC Meeting will start at 1 pm.</p> +<h6 id="wednesday-22th-of-june-2016-room-203"><strong>Wednesday, 22nd of June 2016 (Room 203)</strong></h6> +<p>(full morning: LDBC Board of Directors meeting)</p> +<ul> +<li>12:00 - 13:00 Lunch (provided)</li> +<li>13:00 - 13:30 Hassan Chafi (Oracle) and Josep L. Larriba-Pey (Sparsity) Registration and welcome.</li> +<li>13:30 - 14:00 Peter Boncz (CWI) <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133891.pdf">LDBC introduction and status update</a>.</li> +<li>14:00 - 15:00 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</li> +<li>14:00 Arnau Prat (DAMA-UPC). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133902.pdf">Social Network Benchmark, Interactive workload</a>.</li> +<li>14:30 Tim Hegeman (TU Delft). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133893.pdf">Social Network Benchmark, Analytics workload</a>.</li> +<li>15:00 - 15:30 Coffee break</li> +<li>15:30 - 17:00 Applications and use of Graph Technologies (chair Hassan Chafi) +<ul> +<li>15:30 Martin Zand (University of Rochester Clinical and Translational Science Institute). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133897.pdf">Graphing Healthcare Networks: Data, Analytics, and Use Cases.</a></li> +<li>16:00 David Meibusch, Nathan Hawes (Oracle Labs Australia). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133901.pdf">Frappé: Querying and managing evolving code dependency graphs</a>.</li> +<li>16:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133895.pdf">UniProt: challenges of a public SPARQL endpoint.</a></li> +</ul> +</li> +<li>17:00 - 18:30 Graph Technologies (chair Peter Boncz) +<ul> +<li>17:00 Eugene I. Chong (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133904.pdf">Balancing Act to improve RDF Query Performance in Oracle Database</a>.</li> +<li>17:30 Lijun Chang (University of New South Wales). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133906.pdf">Efficient Subgraph Matching by Postponing Cartesian Products</a>.</li> +<li>18:00 Weining Qian (East China Normal University).
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133908.pdf">On Statistical Characteristics of Real-Life Knowledge Graphs</a>.</li> +</ul> +</li> +</ul> +<h6 id="thursday-23th-of-june-2016-room-203"><strong>Thursday, 23th of June 2016 (Room 203)</strong></h6> +<ul> +<li>08:00 - 09:00 Breakfast (provided)</li> +<li>09:00 - 10:00 Details on the progress of LDBC Task Forces 2 (chair Josep L. Larriba-Pey) +<ul> +<li>09:00 Peter Boncz (CWI). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52133896.pdf">Query Language Task Force status</a></li> +<li>09:45 Marcus Paradies (SAP). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297729.pdf">Social Network Benchmark, Business Intelligence workload</a></li> +</ul> +</li> +<li>10:00 - 12:00 Graph Technologies and Benchmarking (chair Oskar van Rest) +<ul> +<li>10:00 Sergey Edunov (Facebook). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297731.pdf">Generating realistic trillion-edge graphs</a></li> +<li>10:30 George Fletcher (TU Eindhoven). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297733.pdf">An open source framework for schema-driven graph instance and graph query workload generation</a>.</li> +<li>11:00 Yinglong Xia (Huawei Research America): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297735.pdf">An Efficient Big Graph Analytics Platform</a>.</li> +<li>11:30 Zhe Wu (Oracle USA). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297737.pdf">Bridging RDF Graph and Property Graph Data Models</a></li> +</ul> +</li> +<li>12:00 - 13:30 Lunch (provided)</li> +<li>13:30 - 15:30 Graph Technologies (chair Arnau Prat) +<ul> +<li>13:30 Tobias Lindaaker (Neo Technology). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297740.pdf">An open standard for graph queries: the Cypher contribution</a></li> +<li>14:00 Arash Termehchy (Oregon State University). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297742.pdf">Toward Representation Independent Graph Querying &amp; Analytics</a></li> +<li>14:30 Jerven Bolleman (SIB Swiss Institute of Bioinformatics/UniProt consortium). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297745.pdf">In the service of the federation</a></li> +<li>15:00 Nandish Jayaram (Pivotal). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52297747.pdf">Orion: Enabling Suggestions in a Visual Query Builder for Ultra-Heterogeneous Graphs</a>.</li> +</ul> +</li> +<li>15:30 - 16:00 Coffee break</li> +<li>16:00 - 17:15 Applications and use of Graph Technologies (chair Hassan Chafi) +<ul> +<li>16:00 Jans Aasman (Franz Inc.). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428806.pdf">Semantic Data Lake for Healthcare</a></li> +<li>16:15 Kevin Madden (Tom Sawyer Software). 
<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428812.pdf">Dismantling Criminal Networks with Graph and Spatial Visualization and Analysis</a></li> +<li>16:45 Juan Sequeda (Capsenta). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428810.pdf">Using graph representation and semantic technology to virtually integrate and search multiple diverse data sources</a></li> +<li>17:15 Kevin Wilkinson (Hewlett Packard Labs). <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/52428808.pdf">LDBC SNB extensions</a></li> +</ul> +</li> +<li>17:45 - 18:15 Closing discussion</li> +</ul> +<h6 id="friday-24th-of-june-2016-room-105"><strong>Friday, 24th of June 2016 (Room 105)</strong></h6> +<p>At the same venue: the fourth international workshop on Graph Data Management, Experience and Systems (<strong>GRADES16</strong>).</p> +<p>18:30 social dinner for GRADES registrants (place to be announced)</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>22nd and 23rd June 2016</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the <a href="http://www.oracle.com/technetwork/database/rdb/hqcc-dir-134199.pdf">Oracle Conference Center</a></p> +<p>The address is:</p> +<p><strong>Room 203 (Wed-Thu) &amp; Room 105 (Fri)</strong><br> +<strong>Oracle Conference Center</strong><br> +<strong>350 Oracle Parkway</strong><br> +<strong>Redwood City, CA 94065, USA</strong></p> +<p><strong>Maps and situation</strong></p> +<p><a href="https://www.google.com/maps/place/Oracle+Conference+Center/@37.5322827,-122.2667034,17z/data=!3m1!4b1!4m2!3m1!1s0x808f98b5450e8ca3:0xdc75e8b1c02bbb91">Google Maps link</a></p> +<p>Oracle Campus map:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/eighth-tuc-meeting/attachments/40927235/40927234.jpg" alt=""></p> +<h5 id="getting-there"><strong>Getting there</strong></h5> +<h6 id="driving-directions"><strong>Driving directions</strong></h6> +<ul> +<li>[Southbound] <strong>-</strong> Take Highway 101 South (toward San Jose) to the Ralston Ave./Marine World Parkway exit. Take Marine World Parkway east which will loop you back over the freeway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +<li>[Northbound] <strong>-</strong> Take Highway 101 North (toward San Francisco) to the Ralston Ave./Marine World Parkway exit. Take the first exit ramp onto Marine World Parkway. Make a left at the first light onto Oracle Parkway. 350 Oracle Parkway will be on the right.</li> +</ul> +<h5 id="parking"><strong>Parking</strong></h5> +<p>The Conference Center has a designated parking lot located directly across from the building. If the lot is filled there is also additional parking in any of the parking garages located near by. No parking permits are needed.</p> +<h5 id="public-transport"><strong>Public transport</strong></h5> +<p>Take the Caltrain to either San Carlos or Hillsdale and take the free Oracle shuttle from there. 
Get off the Oracle shuttle at 100 Oracle Parkway (second stop) and walk 5 minutes to get to the Conference Center.</p> +<ul> +<li>Caltrain timetables: <a href="http://www.caltrain.com/schedules/weekdaytimetable.html">http://www.caltrain.com/schedules/weekdaytimetable.html</a></li> +<li>Oracle Shuttle timetables: <a href="http://www.caltrain.com/schedules/weekdaytimetable.html">http://www.caltrain.com/schedules/Shuttles/Oracle_Shuttle.html</a></li> +</ul> +<p>You can also take the Caltrain to Belmont and walk 23 min, instead of taking the Oracle shuttle.</p> +<p>Alternatively, SamTrans (San Mateo County&rsquo;s Transit Agency) provides public bus service between the Millbrae BART station and Palo Alto with three stops on Oracle Parkway - one of which is directly in front of the Oracle Conference Center.</p> + + + + + LDBC and Apache Flink + https://ldbcouncil.org/post/ldbc-and-apache-flink/ + Mon, 16 Nov 2015 14:47:00 +0000 + + https://ldbcouncil.org/post/ldbc-and-apache-flink/ + <p>Apache Flink <a href="#references">[1]</a> is an open source platform for distributed stream and batch data processing. Flink&rsquo;s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.</p> +<p><img src="https://flink.apache.org/img/flink-stack-small.png" alt=""></p> +<p>Flink offers multiple APIs to process data from various data sources (e.g. HDFS, HBase, Kafka and JDBC). The DataStream and DataSet APIs allow the user to apply general-purpose data operations, like map, reduce, groupBy and join, on streams and static data respectively. In addition, Flink provides libraries for machine learning (Flink ML), graph processing (Gelly) and SQL-like operations (Table). 
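</p>
+<p>For illustration, a minimal DataStream sketch in the same operator style (this fragment is not part of the original tooling; it only assumes the standard <code>StreamExecutionEnvironment</code> and <code>MapFunction</code> APIs, and the input values are made up):</p>
+<pre><code class="language-java">// Illustrative only: the same map-style operation applied to a stream.
StreamExecutionEnvironment env =
    StreamExecutionEnvironment.getExecutionEnvironment();

env.fromElements("ldbc", "flink", "gradoop") // made-up input values
   .map(new MapFunction&lt;String, String&gt;() {
     @Override
     public String map(String value) {
       return value.toUpperCase(); // transform each stream element
     }
   })
   .print();

env.execute("DataStream example");
</code></pre>
+<p>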
All APIs can be used together in a single Flink program, which enables the definition of powerful analytical workflows and the implementation of distributed algorithms.</p> +<p>The following snippet shows how a wordcount program can be expressed in Flink using the DataSet API:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">&gt;</span> text <span style="color:#f92672">=</span> env<span style="color:#f92672">.</span><span style="color:#a6e22e">fromElements</span><span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the past controls the future.&#34;</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;He who controls the present controls the past.&#34;</span><span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>Tuple2<span style="color:#f92672">&lt;</span>String<span style="color:#f92672">,</span> Integer<span style="color:#f92672">&gt;&gt;</span> wordCounts <span style="color:#f92672">=</span> text +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">flatMap</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> LineSplitter<span style="color:#f92672">())</span> <span style="color:#75715e">// splits the line and outputs (word,1) +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">.</span><span style="color:#a6e22e">groupBy</span><span style="color:#f92672">(</span><span style="color:#ae81ff">0</span><span style="color:#f92672">)</span> <span style="color:#75715e">// group by word +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> <span style="color:#f92672">.</span><span style="color:#a6e22e">sum</span><span style="color:#f92672">(</span><span style="color:#ae81ff">1</span><span style="color:#f92672">);</span> <span style="color:#75715e">// sum the 1&#39;s +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> +</span></span><span style="display:flex;"><span>wordCounts<span style="color:#f92672">.</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>At Leipzig University, we use Apache Flink as the execution layer for our graph analytics platform Gradoop <a href="#references">[2]</a>. The LDBC datagen helps us to evaluate the scalability of our algorithms and operators in a distributed execution environment. To use the generated graph data in Flink, we wrote a tool that transforms the LDBC output files into Flink data sets for further processing <a href="#references">[3]</a>.
Using the class <code>LDBCToFlink</code>, LDBC output files can be read directly from HDFS or from the local file system:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;hdfs:///ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> <span style="color:#75715e">// or &#34;/path/to/social_network&#34; +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> vertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> edges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The tuple classes <code>LDBCVertex</code> and <code>LDBCEdge</code> hold the information generated by the LDBC datagen and are created directly from its output files. During the transformation process, globally unique vertex identifiers are created based on the LDBC identifier and the vertex class. When reading edge files, source and target vertex identifiers are computed in the same way to ensure consistent linking between vertices.</p> +<p>Each <code>LDBCVertex</code> instance contains:</p> +<ul> +<li>an identifier, which is unique among all vertices * a vertex label (e.g. <code>Person</code>, <code>Comment</code>) * a key-value map of properties including also multivalued properties<br> +(e.g. <code>Person.email</code>)</li> +</ul> +<p>Each <code>LDBCEdge</code> instance contains:</p> +<ul> +<li>an identifier, which is unique among all edges</li> +<li>an edge label (e.g. <code>knows</code>, <code>likes</code>)</li> +<li>a source vertex identifier</li> +<li>a target vertex identifier</li> +<li>a key-value map of properties</li> +</ul> +<p>The resulting datasets can be used by the DataSet API and all libraries that are built on top of it (i.e. Flink ML, Gelly and Table). In the following example, we load the LDBC graph from HDFS, filter vertices with the label <code>Person</code> and edges with the label <code>knows</code> and use Gelly to compute the connected components of that subgraph. 
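</p>
+<p>The <code>VertexLabelFilter</code> and <code>EdgeLabelFilter</code> used below are ordinary Flink <code>FilterFunction</code> implementations. A minimal sketch of the vertex variant, assuming <code>LDBCVertex</code> exposes its label through a <code>getLabel()</code> accessor (the actual field or method name in the tool may differ):</p>
+<pre><code class="language-java">import org.apache.flink.api.common.functions.FilterFunction;

// Keeps only vertices carrying the requested label,
// e.g. new VertexLabelFilter(LDBCConstants.VERTEX_CLASS_PERSON).
public class VertexLabelFilter implements FilterFunction&lt;LDBCVertex&gt; {

  private final String label;

  public VertexLabelFilter(String label) {
    this.label = label;
  }

  @Override
  public boolean filter(LDBCVertex vertex) throws Exception {
    return label.equals(vertex.getLabel()); // getLabel() is assumed here
  }
}
</code></pre>
+<p>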
The full source code is available on GitHub <a href="#references">[4]</a>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-java" data-lang="java"><span style="display:flex;"><span><span style="color:#66d9ef">final</span> ExecutionEnvironment env <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> ExecutionEnvironment<span style="color:#f92672">.</span><span style="color:#a6e22e">getExecutionEnvironment</span><span style="color:#f92672">();</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">final</span> LDBCToFlink ldbcToFlink <span style="color:#f92672">=</span> <span style="color:#66d9ef">new</span> LDBCToFlink<span style="color:#f92672">(</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;/home/s1ck/Devel/Java/ldbc_snb_datagen/social_network&#34;</span><span style="color:#f92672">,</span> +</span></span><span style="display:flex;"><span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter vertices with label “Person” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCVertex<span style="color:#f92672">&gt;</span> ldbcVertices <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getVertices</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">VERTEX_CLASS_PERSON</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// filter edges with label “knows” +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>LDBCEdge<span style="color:#f92672">&gt;</span> ldbcEdges <span style="color:#f92672">=</span> ldbcToFlink<span style="color:#f92672">.</span><span style="color:#a6e22e">getEdges</span><span style="color:#f92672">()</span> +</span></span><span style="display:flex;"><span> <span style="color:#f92672">.</span><span style="color:#a6e22e">filter</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeLabelFilter<span style="color:#f92672">(</span>LDBCConstants<span style="color:#f92672">.</span><span style="color:#a6e22e">EDGE_CLASS_KNOWS</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly vertices suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> vertices <span style="color:#f92672">=</span> ldbcVertices<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span 
style="color:#f92672">(</span><span style="color:#66d9ef">new</span> VertexInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly edges suitable for connected components +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Edge<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;&gt;</span> edges <span style="color:#f92672">=</span> ldbcEdges<span style="color:#f92672">.</span><span style="color:#a6e22e">map</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> EdgeInitializer<span style="color:#f92672">());</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// create Gelly graph +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>Graph<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;</span> g <span style="color:#f92672">=</span> Graph<span style="color:#f92672">.</span><span style="color:#a6e22e">fromDataSet</span><span style="color:#f92672">(</span>vertices<span style="color:#f92672">,</span> edges<span style="color:#f92672">,</span> env<span style="color:#f92672">);</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// run connected components on the subgraph for 10 iterations +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>DataSet<span style="color:#f92672">&lt;</span>Vertex<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> Long<span style="color:#f92672">&gt;&gt;</span> components <span style="color:#f92672">=</span> +</span></span><span style="display:flex;"><span> g<span style="color:#f92672">.</span><span style="color:#a6e22e">run</span><span style="color:#f92672">(</span><span style="color:#66d9ef">new</span> ConnectedComponents<span style="color:#f92672">&lt;</span>Long<span style="color:#f92672">,</span> NullValue<span style="color:#f92672">&gt;(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">));</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">// print the component id of the first 10 vertices +</span></span></span><span style="display:flex;"><span><span style="color:#75715e"></span>components<span style="color:#f92672">.</span><span style="color:#a6e22e">first</span><span style="color:#f92672">(</span><span style="color:#ae81ff">10</span><span style="color:#f92672">).</span><span style="color:#a6e22e">print</span><span style="color:#f92672">();</span> +</span></span></code></pre></div><p>The ldbc-flink-import tool is available on Github <a href="#references">[3]</a> and licensed under the GNU GPLv3. If you have any questions regarding the tool please feel free to contact me on GitHub. 
If you find bugs or have any ideas for improvements, please create an issue or a pull request.</p> +<p>If you want to learn more about Apache Flink, a good starting point is the main documentation <a href="#references">[5]</a> and if you have any question feel free to ask the official mailing lists.<br> +There is also a nice set of videos <a href="#references">[6]</a> available from the latest Flink Forward conference.</p> +<h4 id="references">References</h4> +<p>[1] <a href="http://flink.apache.org/">http://flink.apache.org/</a></p> +<p>[2] <a href="https://github.com/dbs-leipzig/gradoop">https://github.com/dbs-leipzig/gradoop</a></p> +<p>[3] <a href="https://github.com/s1ck/ldbc-flink-import">https://github.com/s1ck/ldbc-flink-import</a></p> +<p>[4] <a href="https://gist.github.com/s1ck/b33e6a4874c15c35cd16">https://gist.github.com/s1ck/b33e6a4874c15c35cd16</a></p> +<p>[5] <a href="https://ci.apache.org/projects/flink/flink-docs-release-0.10/">https://ci.apache.org/projects/flink/flink-docs-release-0.10/</a></p> +<p>[6] <a href="https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA">https://www.youtube.com/channel/UCY8_lgiZLZErZPF47a2hXMA</a></p> + + + + + Seventh TUC Meeting + https://ldbcouncil.org/event/seventh-tuc-meeting/ + Mon, 09 Nov 2015 14:17:30 -0400 + + https://ldbcouncil.org/event/seventh-tuc-meeting/ + <p>The LDBC consortium is pleased to announce its Seventh Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at <a href="http://www.research.ibm.com/labs/watson">IBM&rsquo;s TJ Watson</a> facility on <strong>Monday and Tuesday November 9/10, 2015.</strong></p> +<p>This will be the first TUC meeting after the finalisation of the LDBC FP7 EC funded project. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the LDBC organisation officials.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact Damaris Coll (UPC) at <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>; in order to notify IBM security in advance, registration requests need to be in by Nov 1.</p> +<p>In the agenda, there will be talks given by LDBC members and LDBC activities, but there will also be room for a number of short 20-minute talks by other participants. We are specifically interested in learning about new challenges in graph data management (where benchmarking would become useful) and on hearing about actual user stories and scenarios that could inspire benchmarks. Further, talks that provide feedback on existing benchmark (proposals) are very relevant. But nothing is excluded a priori if it is graph data management related. Talk proposals can be forwarded to Damaris as well and will be handled by Peter Boncz and Larri.</p> +<p>Further, we call on you if you or your colleagues would happen to have contacts with companies that deal with graph data management scenarios to also attend and possibly present. 
LDBC is always looking to expand its circle of participants in TUCs meeting, its graph technology users contacts but also eventually its membership base.</p> +<p>In this page, you&rsquo;ll find information about the following items:</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a><br> +- <a href="#date"><strong>Date</strong></a><br> +- <a href="#venue"><strong>Venue</strong></a><br> +- <a href="#maps-and-situation"><strong>Maps and situation</strong></a><br> +- <a href="#getting-there"><strong>Getting there</strong></a></li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>Monday, 9th of November 2015</strong></p> +<p>8:45 - 9:15 Registration and welcome (Yinglong Xia and Josep L. Larriba Pey)</p> +<p>9:15 - 9:30 LDBC introduction and status update (Josep L. Larriba-Pey)</p> +<p>9:30 - 10:30 Details on the progress of LDBC Task Forces 1 (chair Josep L. Larriba-Pey)</p> +<p>9:30 Arnau Prat (DAMA-UPC). Social Network Benchmark, Interactive workload</p> +<p>10:00 Orri Erling (OpenLink Software). Social Network Benchmark, Business Intelligence workload</p> +<p>10:30-11:00 Coffee break</p> +<p>11:00 - 12:30 Details on the progress of LDBC Task Forces 2 (chair Yinglong Xia)</p> +<p>11:00 Alexandru Iosup (TU Delft). Social Network Benchmark, Analytics workload.</p> +<p>11:30 Claudio Gutierrez (U Chile). Query Language Task Force status.</p> +<p>12:00 Atanas Kiryakov (Ontotext). Semantic Publishing Benchmark status</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 - 16:00 Technologies and benchmarking (chair Hassan Chafi)</p> +<p>14:00 Molham Aref (LogicBlox). Graph Data Management with LogicBlox</p> +<p>14:30 Peter Kogge (Notre Dame). BFS as in Graph500 on today&rsquo;s architectures</p> +<p>15:00 Ching-Yung Lin (IBM). Status and Demo of IBM System G</p> +<p>15:30-16:00 Coffee break</p> +<p>16:00 - 17:00 Technologies (chair Irini Fundulaki)</p> +<p>16:00 Kavitha Srinivas (IBM). SQLGraph: An efficient relational based property graph store</p> +<p>16:30 David Ediger (GeorgiaTech). STINGER</p> +<p>17:00 Gary King (Franz Inc.). AllegroGraph&rsquo;s SPARQL implementation with Social Network Analytics abilities using Magic Properties</p> +<p>17:30 Manoj Kumar (IBM). Linear Algebra Formulation for Large Graph Analytics</p> +<p>18:00 Reihaneh Amini (Wright State University) Linked Data in the GeoLink Usecase</p> +<p>19:00 Social dinner</p> +<p><strong>Tuesday 10th November 2015</strong></p> +<p>9:00 - 10:30 Technology, Applications and Benchmarking (chair Alexandru Iosup)</p> +<p>9:00 Philip Rathle (Neo). On openCypher</p> +<p>9:20 Morteza Shahriari (University of Florida). Multi-modal Probabilistic Knowledge Base for Remote Sensing Species Identification</p> +<p>9:50 Peter Kogge (Notre Dame). Challenging problems with Lexis Nexis Risk Solutions</p> +<p>10:10 Arnau Prat (DAMA-UPC). DATAGEN, status and perspectives for synthetic data generation</p> +<p>10:30 - 11:00 Coffee break</p> +<p>11:00 - 12:45 Applications and use of Graph Technologies (chair Atanas Kiryakov)</p> +<p>11:00 Hassan Chafi (Oracle). Status and characteristics of PGQL</p> +<p>11:20 David Guedalia (TAGIIO). Multi-tier distributed mobile applications and how they split their workload,</p> +<p>11:40 Guojing Cong (IBM). Algorithmic technique and architectural support for fast graph analysis</p> +<p>12:00 Josep Lluis Larriba-Pey. 
Conclusions for the TUC meeting and future perspectives</p> +<p>12:30 - 14:00 Lunch break</p> +<p>14:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>9th and 10th November 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held in the IBM Thomas J Watson Research Center.<br> +The address is:</p> +<p><strong>IBM Thomas J Watson Research Center</strong><br> +<strong>1101 Kitchawan Rd,</strong><br> +<strong>Yorktown Heights, NY 10598, USA</strong></p> +<p>If you are using a <em>GPS system</em>, please enter <strong>&ldquo;200 Aqueduct Road, Ossining NY, 10562&rdquo;</strong> for accurate directions to the lab entrance. You may also want to check the routing online.</p> +<p>The meeting will take place in the <em>Auditorium</em> on November 9th, and in Meeting Room <em>20-043</em> on November 10th.</p> +<h6 id="maps-and-situation"><strong>Maps and situation</strong></h6> +<p>You are highly suggested to <strong>rent a car</strong> for your convenience, since the public transportation system does not cover this area very well. Besides, there is no hotel within walkable distance to the IBM T.J. Watson Research Center. Feel free to find carpool with other attendees. You may find car rental and hotels through <a href="http://www.orbitz.com">www.orbitz.com</a>, or <a href="http://www.expedia.com">www.expedia.com</a> Feel free to email <a href="mailto:yxia@us.ibm.com">yxia@us.ibm.com</a> for any questions.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/seventh-tuc-meeting/attachments/6882333/15926330.png" alt=""></p> +<h6 id="getting-there"><strong>Getting there</strong></h6> +<p><strong>Upper and Eastern New England</strong></p> +<p>Route I-84 west to Route I-684, south to Exit 6, west on Route 35 to Route 100, south to Route 134, west 2.5 miles. IBM is on the left.</p> +<p><strong>New Haven and Connecticut Shores</strong></p> +<p>Merritt Parkway or New England Thruway (Route I-95) west to Route I-287, west to Exit 3, north on Sprain Brook Parkway, which merges into Taconic State Parkway, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New Jersey</strong></p> +<p>Take New York State Thruway (Route I-87) east across the Tappan Zee Bridge and follow signs to the Saw Mill Parkway north. Proceed north on Saw Mill River Parkway to Taconic State Parkway exit, north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>Upstate New York</strong></p> +<p>Route I-84 east across Newburgh-Beacon Bridge to Exit 16-S. Taconic State Parkway south to Route 134 East exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>New York City (Manhattan)</strong></p> +<p>Henry Hudson Parkway north, which becomes Saw Mill River Parkway, north to Taconic State Parkway exit. North on Taconic State Parkway to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>John F. Kennedy International Airport</strong></p> +<p>North on Van Wyck Expressway to the Whitestone Expressway and continue north across the Bronx-Whitestone Bridge to the Hutchinson River Parkway north to the Cross County Parkway exit and proceed west to the Bronx River Parkway. 
North on the Bronx River Parkway to the Sprain Brook Parkway, which merges into the Taconic State Parkway. Continue north to Ossining/Route 134 exit. Turn right and proceed east on Route 134 several hundred yards. IBM is on the right.</p> +<p><strong>LaGuardia Airport</strong></p> +<p>East on the Grand Central Parkway, north on the Whitestone Expressway, and continue north across the Bronx-Whitestone Bridge. Continue with instructions from John F. Kennedy International Airport, above.</p> +<p><strong>Newark International Airport</strong></p> +<p>North on the New Jersey Turnpike (Route I-95). Stay in local lanes and take Exit 72 for Palisades Interstate Parkway. North on the Palisades Interstate Parkway to the New York State Thruway, Route I-87, and east across the Tappan Zee Bridge. Continue with instructions from New Jersey, above.</p> +<p><strong>Stewart International Airport</strong></p> +<p>Route 207 east to Route I-84, east across Newburgh-Beacon Bridge to Taconic State Parkway, south. Continue with instructions from Upstate New York, above.</p> +<p><strong>Westchester County Airport</strong></p> +<p>Right on Route 120, north. Turn left where Route 120 merges with Route 133. Continue on Route 120. Cross Route 100 and continue straight on Shingle House Road to Pines Bridge Road. Turn right and proceed several hundred yards. IBM is on the left.</p> +<p><strong>Public Transportation</strong></p> +<p>Metropolitan Transportation Authority (MTA) train stations nearest to the Yorktown Heights location are the Croton-Harmon and White Plains stations. Taxi service is available at both locations.</p> + + + + + Elements of Instance Matching Benchmarks: a Short Overview + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + Tue, 16 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/elements-of-instance-matching-benchmarks-a-short-overview/ + <p>The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not explicitly stated but is discovered using <strong>instance matching</strong> techniques and tools. Instance matching is also known as <strong>record linkage</strong> <a href="#references">[1]</a>, <strong>duplicate detection</strong> <a href="#references">[2]</a>, <strong>entity resolution</strong> <a href="#references">[3]</a> and <strong>object identification</strong> <a href="#references">[4]</a>.</p> +<p>For instance, a search in Geonames (<a href="http://www.geonames.org/">http://www.geonames.org/</a>) for &ldquo;Athens&rdquo; would return a resource (i.e., URI) accompanied with a map of the area and information about the place; additional information for the city of Athens can be found in other datasets such as for instance DBpedia (<a href="http://dbpedia.org/">http://dbpedia.org/</a>) or Open Government Datasets (<a href="http://data.gov.gr/">http://data.gov.gr/</a>). 
To obtain all the necessary information about the city of Athens, we need to establish that the retrieved resources refer to the same real world object.</p> +<p>Web resources are published by &ldquo;autonomous agents&rdquo; who choose their preferred information representation or the one that best fits the application of interest. Furthermore, different representations of the same real world entity are due to data acquisition errors or different acquisition techniques used to process scientific data. Moreover, real world entities evolve and change over time, and sources need to keep track of these developments, a task that is very hard and often not possible. Finally, when integrating data from multiple sources, the process itself may add new erroneous data. Clearly, these problems did not first arise in the era of Web Data, so it is not surprising that instance matching systems have been around for several years <a href="#references">[2]</a><a href="#references">[5]</a>.</p> +<p>It is, however, essential at this point to develop, along with instance and entity matching systems, <em>instance matching benchmarks that determine the weak and strong points of those systems, as well as their overall quality, in order to support users in deciding which system to use for their needs</em>. Hence, well-defined, good-quality benchmarks are important for comparing the performance of available or under-development instance matching systems. Benchmarks are used not only to inform users of the strengths and weaknesses of systems, but also to motivate developers, researchers and technology vendors to deal with the weak points of their systems and to ameliorate their performance and functionality. They are also useful for identifying the settings in which each of the systems has optimal performance. Benchmarking aims at providing an objective basis for such assessments.</p> +<p>An instance matching benchmark for Linked Data consists of a <em>source</em> and <em>target dataset</em> implementing a set of <em>test cases</em>, where each test case addresses a different kind of requirement regarding instance matching, a <em>ground truth</em> or <em>gold standard</em>, and finally the <em>evaluation metrics</em> used to <em>assess the benchmark</em>.</p> +<p>Datasets are the raw material of a benchmark. A benchmark comprises a <em>source</em> and a <em>target</em> dataset, and the objective of an instance matching system is to discover the matches between the two. Datasets are characterized by (a) their <em>nature</em> (<em>real</em> or <em>synthetic</em>), (b) the <em>schemas/ontologies</em> they use, (c) their <em>domains</em>, (d) the <em>languages</em> they are written in, and (e) the <em>variations/heterogeneities</em> of the datasets. Real datasets are widely used in benchmarks since they offer realistic conditions for heterogeneity problems and they have realistic distributions. <em>Synthetic datasets</em> are generated using automated data generators and are useful because they offer fully controlled test conditions, have accurate gold standards and allow setting the focus on specific types of heterogeneity problems in a systematic manner.</p> +<p>Datasets (and benchmarks) may contain different <em>kinds of variations</em> that correspond to <em>different test cases</em>. According to Ferrara et al.
<a href="#references">[6]</a><a href="#references">[7]</a>, three kinds of variations exist for Linked Data, namely <em>data variations</em>, <em>structural variations</em> and <em>logical variations</em>. The first refers mainly to differences due to typographical errors, differences in the employed data formats, language etc. The second refers to the differences in the structure of the employed Linked Data schemas. Finally, the third type derives from the use of semantically rich RDF and OWL constructs that enable one to define hierarchies and equivalence of classes and properties, (in)equality of instances, complex class definitions through union and intersection among others.</p> +<p>The common case in real benchmarks is that the datasets to be matched contain different kinds (combinations) of variations. On the other hand, synthetic datasets may be purposefully designed to contain specific types (or combinations) of variations (e.g., only structural), or may be more general in an effort to illustrate all the common cases of discrepancies that appear in reality between individual descriptions.</p> +<p>The <em>gold standard</em> is considered as the “correct answer sheet” of the benchmark, and is used to judge the completeness and soundness of the result sets of the benchmarked systems. For instance matching benchmarks employing synthetic datasets, the gold standard is always automatically generated, as the errors (variations) that are added into the datasets are known and systematically created. When it comes to real datasets, the gold standard can be either manually curated or (semi-) automatically generated. In the first case, domain experts manually mark the matches between the datasets, whereas in the second, supervised and crowdsourcing techniques aid the process of finding the matches, a process that is often time consuming and error prone.</p> +<p>Last, an instance matching benchmark uses <em>evaluation metrics</em> to determine and assess the systems’ output quality and performance. For instance matching tools, performance is not a critical aspect. On the other hand, an instance matching tool should return all and only the correct answers. So, what matters most is returning the relevant matches, rather than returning them quickly. For this reason, the evaluation metrics that are dominantly employed for instance matching benchmarks are the standard <em>precision</em>, <em>recall</em> and <em>f-measure</em> metrics.</p> +<h4 id="references">References</h4> +<p>[1] Li, C., Jin, L., and Mehrotra, S. (2006) Supporting efficient record linkage for large data sets using mapping techniques. WWW 2006.</p> +<p>[2] Dragisic, Z., Eckert, K., Euzenat, J., Faria, D., Ferrara, A., Granada, R., Ivanova, V., Jimenez-Ruiz, E., Oskar Kempf, A., Lambrix, P., Montanelli, S., Paulheim, H., Ritze, D., Shvaiko, P., Solimando, A., Trojahn, C., Zamaza, O., and Cuenca Grau, B. (2014) Results of the Ontology Alignment Evaluation Initiative 2014. Proc. 9th ISWC workshop on ontology matching (OM 2014).</p> +<p>[3] Bhattacharya, I. and Getoor, L. (2006) Entity resolution in graphs. Mining Graph Data. Wiley and Sons 2006.</p> +<p>[4] Noessner, J., Niepert, M., Meilicke, C., and Stuckenschmidt, H. (2010) Leveraging Terminological Structure for Object Reconciliation. In ESWC 2010.</p> +<p>[5] Flouris, G., Manakanatas, D., Kondylakis, H., Plexousakis, D., Antoniou, G. 
Ontology Change: Classification and Survey (2008) Knowledge Engineering Review (KER 2008), pages 117-152.</p> +<p>[6] Ferrara, A., Lorusso, D., Montanelli, S., and Varese, G. (2008) Towards a Benchmark for Instance Matching. Proc. 3th ISWC workshop on ontology matching (OM 2008).</p> +<p>[7] Ferrara, A., Montanelli, S., Noessner, J., and Stuckenschmidt, H. (2011) Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p> + + + + + SNB Interactive Part 3: Choke Points and Initial Run on Virtuoso + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + Wed, 10 Jun 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/ + <p>In this post we will look at running the <a href="https://ldbcouncil.org/developer/snb">LDBC SNB</a> on <a href="https://virtuoso.openlinksw.com/">Virtuoso</a>.</p> +<p>First, let&rsquo;s recap what the benchmark is about:</p> +<ol> +<li> +<p>fairly frequent short updates, with no update contention worth mentioning</p> +</li> +<li> +<p>short random lookups</p> +</li> +<li> +<p>medium complex queries centered around a person&rsquo;s social environment</p> +</li> +</ol> +<p>The updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an online social application does lookups for the most part. The medium complex queries are to challenge the DBMS.</p> +<p>The DBMS challenges have to do firstly with query optimization, and secondly with execution with a lot of non-local random access patterns. Query optimization is not a requirement, <em>per se,</em> since imperative implementations are allowed, but we will see that these are no more free of the laws of nature than the declarative ones.</p> +<p>The workload is arbitrarily parallel, so intra-query parallelization is not particularly useful, if also not harmful. There are latency constraints on operations which strongly encourage implementations to stay within a predictable time envelope regardless of specific query parameters. The parameters are a combination of person and date range, and sometimes tags or countries. The hardest queries have the potential to access all content created by people within 2 steps of a central person, so possibly thousands of people, times 2000 posts per person, times up to 4 tags per post. We are talking in the millions of key lookups, aiming for sub-second single-threaded execution.</p> +<p>The test system is the same as used in the <a href="http://www.openlinksw.com/weblog/oerling/?id=1739">TPC-H series</a>: dual Xeon E5-2630, 2x6 cores x 2 threads, 2.3GHz, 192 GB RAM. The software is the <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics branch</a> of <a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack, available from www.github.com</a>.</p> +<p>The dataset is the SNB 300G set, with:</p> +<table> +<thead> +<tr> +<th>1,136,127</th> +<th>persons</th> +</tr> +</thead> +<tbody> +<tr> +<td>125,249,604</td> +<td>knows edges</td> +</tr> +<tr> +<td>847,886,644</td> +<td>posts, including replies</td> +</tr> +<tr> +<td>1,145,893,841</td> +<td>tags of posts or replies</td> +</tr> +<tr> +<td>1,140,226,235</td> +<td>likes of posts or replies</td> +</tr> +</tbody> +</table> +<p>As an initial step, we run the benchmark as fast as it will go. 
We use 32 threads on the driver side for 24 hardware threads.</p> +<p>Below are the numerical quantities for a 400K operation run after 150K operations worth of warmup.</p> +<p><strong>Duration:</strong> 10:41.251<br> +<strong>Throughput:</strong> 623.71 (op/s)</p> +<p>The statistics that matter are detailed below, with operations ranked in order of descending client-side wait-time. All times are in milliseconds.</p> +<table> +<thead> +<tr> +<th>% of total</th> +<th>total_wait</th> +<th>name</th> +<th>count</th> +<th>mean</th> +<th>min</th> +<th>max</th> +</tr> +</thead> +<tbody> +<tr> +<td>20%</td> +<td>4,231,130</td> +<td>LdbcQuery5</td> +<td>656</td> +<td>6,449.89</td> +<td>245</td> +<td>10,311</td> +</tr> +<tr> +<td>11%</td> +<td>2,272,954</td> +<td>LdbcQuery8</td> +<td>18,354</td> +<td>123.84</td> +<td>14</td> +<td>2,240</td> +</tr> +<tr> +<td>10%</td> +<td>2,200,718</td> +<td>LdbcQuery3</td> +<td>388</td> +<td>5,671.95</td> +<td>468</td> +<td>17,368</td> +</tr> +<tr> +<td>7.3%</td> +<td>1,561,382</td> +<td>LdbcQuery14</td> +<td>1,124</td> +<td>1,389.13</td> +<td>4</td> +<td>5,724</td> +</tr> +<tr> +<td>6.7%</td> +<td>1,441,575</td> +<td>LdbcQuery12</td> +<td>1,252</td> +<td>1,151.42</td> +<td>15</td> +<td>3,273</td> +</tr> +<tr> +<td>6.5%</td> +<td>1,396,932</td> +<td>LdbcQuery10</td> +<td>1,252</td> +<td>1,115.76</td> +<td>13</td> +<td>4,743</td> +</tr> +<tr> +<td>5%</td> +<td>1,064,457</td> +<td>LdbcShortQuery3PersonFriends</td> +<td>46,285</td> +<td>22.9979</td> +<td>0</td> +<td>2,287</td> +</tr> +<tr> +<td>4.9%</td> +<td>1,047,536</td> +<td>LdbcShortQuery2PersonPosts</td> +<td>46,285</td> +<td>22.6323</td> +<td>0</td> +<td>2,156</td> +</tr> +<tr> +<td>4.1%</td> +<td>885,102</td> +<td>LdbcQuery6</td> +<td>1,721</td> +<td>514.295</td> +<td>8</td> +<td>5,227</td> +</tr> +<tr> +<td>3.3%</td> +<td>707,901</td> +<td>LdbcQuery1</td> +<td>2,117</td> +<td>334.389</td> +<td>28</td> +<td>3,467</td> +</tr> +<tr> +<td>2.4%</td> +<td>521,738</td> +<td>LdbcQuery4</td> +<td>1,530</td> +<td>341.005</td> +<td>49</td> +<td>2,774</td> +</tr> +<tr> +<td>2.1%</td> +<td>440,197</td> +<td>LdbcShortQuery4MessageContent</td> +<td>46,302</td> +<td>9.50708</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.9%</td> +<td>407,450</td> +<td>LdbcUpdate5AddForumMembership</td> +<td>14,338</td> +<td>28.4175</td> +<td>0</td> +<td>2,008</td> +</tr> +<tr> +<td>1.9%</td> +<td>405,243</td> +<td>LdbcShortQuery7MessageReplies</td> +<td>46,302</td> +<td>8.75217</td> +<td>0</td> +<td>2,112</td> +</tr> +<tr> +<td>1.9%</td> +<td>404,002</td> +<td>LdbcShortQuery6MessageForum</td> +<td>46,302</td> +<td>8.72537</td> +<td>0</td> +<td>1,968</td> +</tr> +<tr> +<td>1.8%</td> +<td>387,044</td> +<td>LdbcUpdate3AddCommentLike</td> +<td>12,659</td> +<td>30.5746</td> +<td>0</td> +<td>2,060</td> +</tr> +<tr> +<td>1.7%</td> +<td>361,290</td> +<td>LdbcShortQuery1PersonProfile</td> +<td>46,285</td> +<td>7.80577</td> +<td>0</td> +<td>2,015</td> +</tr> +<tr> +<td>1.6%</td> +<td>334,409</td> +<td>LdbcShortQuery5MessageCreator</td> +<td>46,302</td> +<td>7.22234</td> +<td>0</td> +<td>2,055</td> +</tr> +<tr> +<td>1%</td> +<td>220,740</td> +<td>LdbcQuery2</td> +<td>1,488</td> +<td>148.347</td> +<td>2</td> +<td>2,504</td> +</tr> +<tr> +<td>0.96%</td> +<td>205,910</td> +<td>LdbcQuery7</td> +<td>1,721</td> +<td>119.646</td> +<td>11</td> +<td>2,295</td> +</tr> +<tr> +<td>0.93%</td> +<td>198,971</td> +<td>LdbcUpdate2AddPostLike</td> +<td>5,974</td> +<td>33.3062</td> +<td>0</td> +<td>1,987</td> +</tr> +<tr> +<td>0.88%</td> +<td>189,871</td> 
+<td>LdbcQuery11</td>
+<td>2,294</td>
+<td>82.7685</td>
+<td>4</td>
+<td>2,219</td>
+</tr>
+<tr>
+<td>0.85%</td>
+<td>182,964</td>
+<td>LdbcQuery13</td>
+<td>2,898</td>
+<td>63.1346</td>
+<td>1</td>
+<td>2,201</td>
+</tr>
+<tr>
+<td>0.74%</td>
+<td>158,188</td>
+<td>LdbcQuery9</td>
+<td>78</td>
+<td>2,028.05</td>
+<td>1,108</td>
+<td>4,183</td>
+</tr>
+<tr>
+<td>0.67%</td>
+<td>143,457</td>
+<td>LdbcUpdate7AddComment</td>
+<td>3,986</td>
+<td>35.9902</td>
+<td>1</td>
+<td>1,912</td>
+</tr>
+<tr>
+<td>0.26%</td>
+<td>54,947</td>
+<td>LdbcUpdate8AddFriendship</td>
+<td>571</td>
+<td>96.2294</td>
+<td>1</td>
+<td>988</td>
+</tr>
+<tr>
+<td>0.2%</td>
+<td>43,451</td>
+<td>LdbcUpdate6AddPost</td>
+<td>1,386</td>
+<td>31.3499</td>
+<td>1</td>
+<td>2,060</td>
+</tr>
+<tr>
+<td>0.01%</td>
+<td>1,848</td>
+<td>LdbcUpdate4AddForum</td>
+<td>103</td>
+<td>17.9417</td>
+<td>1</td>
+<td>65</td>
+</tr>
+<tr>
+<td>0.00%</td>
+<td>44</td>
+<td>LdbcUpdate1AddPerson</td>
+<td>2</td>
+<td>22</td>
+<td>10</td>
+<td>34</td>
+</tr>
+</tbody>
+</table>
+<p>At this point we have in-depth knowledge of the choke points the benchmark stresses, and we can give a first assessment of whether the design meets its objectives for setting an agenda for the coming years of graph database development.</p>
+<p>The implementation is well optimized in general but still has maybe 30% room for improvement. We note that this is based on a compressed column store. One could think that alternative data representations, like in-memory graphs of structs and pointers between them, are better for the task. This is not necessarily so; at the least, a compressed column store is much more space efficient. Space efficiency is the root of cost efficiency, since as soon as the working set is not in memory, a random access workload is badly hit.</p>
+<p>The set of choke points (technical challenges) actually revealed by the benchmark is so far as follows:</p>
+<ul>
+<li>
+<p><em>Cardinality estimation under heavy data skew —</em> Many queries take a tag or a country as a parameter. The cardinalities associated with tags vary from 29M posts for the most common to 1 for the least common. Q6 has a common tag (in top few hundred) half the time and a random, most often very infrequent, one the rest of the time. A declarative implementation must recognize the cardinality implications from the literal and plan accordingly. An imperative one would have to count. Missing this makes Q6 take about 40% of the time instead of 4.1% when adapting.</p>
+</li>
+<li>
+<p><em>Covering indices —</em> Being able to make multi-column indices that duplicate some columns from the table often saves an entire table lookup. For example, an index on post by author can also contain the post&rsquo;s creation date.</p>
+</li>
+<li>
+<p><em>Multi-hop graph traversal —</em> Most queries access a two-hop environment starting at a person. Two queries look for shortest paths of unbounded length. For the two-hop case, it makes almost no difference whether this is done as a union or a special graph traversal operator. For shortest paths, this simply must be built into the engine; doing this client-side incurs prohibitive overheads. A bidirectional shortest path operation is a requirement for the benchmark.</p>
+</li>
+<li>
+<p><em>Top <em>K</em> —</em> Most queries returning posts order results by descending date. Once there are at least <em>k</em> results, anything older than the <em>k</em>th can be dropped, adding a date selection as early as possible in the query.
This interacts with vectored execution, so that starting with a short vector size more rapidly produces an initial top <em>k</em>.</p> +</li> +<li> +<p><em>Late projection —</em> Many queries access several columns and touch millions of rows but only return a few. The columns that are not used in sorting or selection can be retrieved only for the rows that are actually returned. This is especially useful with a column store, as this removes many large columns (e.g., text of a post) from the working set.</p> +</li> +<li> +<p><em>Materialization —</em> Q14 accesses an expensive-to-compute edge weight, the number of post-reply pairs between two people. Keeping this precomputed drops Q14 from the top place. Other materialization would be possible, for example Q2 (top 20 posts by friends), but since Q2 is just 1% of the load, there is no need. One could of course argue that this should be 20x more frequent, in which case there could be a point to this.</p> +</li> +<li> +<p><em>Concurrency control —</em> Read-write contention is rare, as updates are randomly spread over the database. However, some pages get read very frequently, e.g., some middle level index pages in the post table. Keeping a count of reading threads requires a mutex, and there is significant contention on this. Since the hot set can be one page, adding more mutexes does not always help. However, hash partitioning the index into many independent trees (as in the case of a cluster) helps for this. There is also contention on a mutex for assigning threads to client requests, as there are large numbers of short operations.</p> +</li> +</ul> +<p>In subsequent posts, we will look at specific queries, what they in fact do, and what their theoretical performance limits would be. In this way we will have a precise understanding of which way SNB can steer the graph DB community.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + SNB and Graphs Related Presentations at GRADES '15 + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + Fri, 29 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-and-graphs-related-presentations-at-grades-15/ + <p>Next 31st of May the GRADES workshop will take place in Melbourne within the ACM/SIGMOD presentation. GRADES started as an initiative of the Linked Data Benchmark Council in the SIGMOD/PODS 2013 held in New York.</p> +<p>Among the papers published in this edition we have &ldquo;Graphalytics: A Big Data Benchmark for Graph-Processing Platforms&rdquo;, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can be found in <a href="https://github.com/ldbc">https://github.com/ldbc</a>) as the base to execute the algorithms used for the benchmark, among which we have BFS, community detection and connected components. We also have &ldquo;Microblogging Queries on Graph Databases: an Introspection&rdquo; which benchmarks two of the most significant Graph Databases in the market, i.e. 
Neo4j and Sparksee using microblogging queries on top of twitter data. We can finally mention &ldquo;Frappé: Querying the Linux Kernel Dependency Graph&rdquo; which presents a framework for querying and visualising the dependencies of large C/C++ software systems.</p> +<p><a href="http://event.cwi.nl/grades2015/program.shtml">Check the complete agenda.</a></p> +<p>Meet you in Melbourne!</p> + + + + + SNB Interactive Part 2: Modeling Choices + https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/ + Tue, 26 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices/ + <p><a href="https://ldbcouncil.org/benchmarks/snb">​SNB Interactive</a> is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.</p> +<p>In the case of <a href="http://dbpedia.org/resource/Virtuoso_Universal_Server">Virtuoso</a>, we have played with <a href="http://dbpedia.org/resource/SQL">SQL</a> and <a href="http://dbpedia.org/resource/SPARQL">SPARQL</a> implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that this allows to materialize multi-part indices and data orderings that make sense for the application. In other words, there is transparency into physical design. An RDF application may also have physical design by means ofstructure-aware storage but this is more complex and here we are just concerned with speed and having things work precisely as we intend.</p> +<h3 id="schema-design">Schema Design</h3> +<p>SNB has a regular schema described by a <a href="https://en.wikipedia.org/wiki/Unified_Modeling_Language">UML</a> diagram. This has a number of relationships of which some have attributes. There are no heterogenous sets, e.g. no need for run-time typed attributes or graph edges with the same label but heterogeneous end points. Translation into SQL or RDF is straightforward. Edges with attributes, e.g. the knows relation between people would end up represented as a subject with the end points and the date since as properties. The relational implementation has a two-part primary key and the date since as a dependent column. A native property graph database would use an edge with an extra property for this, as such are typically supported.</p> +<p>The only table-level choice has to do with whether <code>posts</code> and <code>comments</code> are kept in the same or different data structures. The Virtuoso schema has a single table for both, with nullable columns for the properties that occur only in one. This makes the queries more concise. There are cases where only non-reply posts of a given author are accessed. This is supported by having two author foreign key columns each with its own index. There is a single nullable foreign key from the reply to the post/comment being replied to.</p> +<p>The workload has some frequent access paths that need to be supported by index. Some queries reward placing extra columns in indices. For example, a common pattern is accessing the most recent posts of an author or group of authors. 
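</p>
+<p>To make this concrete, the following is a small, purely illustrative Python sketch (not Virtuoso code; all names are made up) of why keeping posts ordered by author and creation date lets a &ldquo;newest posts&rdquo; top-k be answered from the index alone:</p>
+<pre><code>from bisect import insort
+from collections import defaultdict
+
+# Toy "index": for each author, keep (creation_date, post_id) pairs sorted.
+# This mimics a composite key on (creator, creation date, post id): the k
+# newest posts of an author sit at the end of the list, so no further
+# lookup into the full post record is needed to produce the top-k.
+posts_by_author = defaultdict(list)
+
+def index_post(creator_id, creation_date, post_id):
+    insort(posts_by_author[creator_id], (creation_date, post_id))
+
+def newest_posts(creator_ids, k):
+    # Take at most k candidates per author, then keep the k most recent.
+    candidates = []
+    for creator in creator_ids:
+        candidates.extend(posts_by_author[creator][-k:])
+    return sorted(candidates, reverse=True)[:k]
+
+index_post(101, 20120529, 1)
+index_post(101, 20120601, 2)
+index_post(202, 20120530, 3)
+print(newest_posts([101, 202], 2))  # [(20120601, 2), (20120530, 3)]
+</code></pre>
+<p>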
There, having a composite key <code>of ps_creatorid</code>, <code>ps_creationdate</code>, <code>ps_postid</code> pays off since the top-k on <code>creationdate</code> can be pushed down into the index without needing a reference to the table.</p> +<p>The implementation is free to choose data types for attributes, specifically datetimes. The Virtuoso implementation adopts the practice of the <a href="http://dbpedia.org/resource/DEX_(Graph_database)">Sparksee</a> and <a href="http://dbpedia.org/resource/Neo4j">Neo4J</a> implementations and represents this is a count of milliseconds since epoch. This is less confusing, faster to compare and more compact than a native datetime datatype that may or may not have timezones etc. Using a built-in datetime seems to be nearly always a bad idea. A dimension table or a number for a time dimension avoids the ambiguities of a calendar or at least makes these explicit.</p> +<p>The benchmark allows procedurally maintaining materializations of intermediate results for use by queries as long as these are maintained transaction by transaction. For example, each person could have the 20 newest posts by immediate contacts precomputed. This would reduce Q2 &ldquo;top of the wall&rdquo; to a single lookup. This dows not however appear to be worthwhile. The Virtuoso implementation does do one such materialization for Q14: A connection weight is calculated for every pair of persons that know each other. This is related to the count of replies by one or the other to content generated by the other. If there does not exist a single reply in either direction, the weight is taken to be 0. This weight is precomputed after bulk load and subsequently maintained each time a reply is added. The table for this is the only row-wise structure in the schema and represents a half matrix of connected people, i.e. <code>person1</code>, <code>person2</code> -&gt; <code>weight</code>. <code>Person1</code> is by convention the one with the smaller <code>p_personid</code>. Note that comparing id&rsquo;s in this way is useful but not normally supported by RDF systems. RDF would end up comparing strings of URI&rsquo;s with disastrous performance implications unless an implementation specific trick were used.</p> +<p>In the next installment we will analyze an actual run.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference + https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/ + Mon, 25 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/ldbc-participates-in-the-36th-edition-of-the-acm-sigmod-pods-conference/ + <p>LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015. 
The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.</p> +<p>On the industry track, LDBC will be presenting the <em>Social Network Benchmark Interactive Workload</em> by Orri Erling (OpenLink Software), Alex Averbuch (Neo Technology), Josep Larriba-Pey (Sparsity Technologies), Hassan Chafi (Oracle Labs), Andrey Gubichev (TU Munich), Arnau Prat (Universitat Politècnica de Catalunya), Minh-Duc Pham (VU University Amsterdam) and Peter Boncz (CWI).</p> +<p>You can read more about the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark here</a> and collaborate if you&rsquo;re interested!</p> +<p>The other presentation will be at the GRADES workshop within the SIGMOD program regarding <em>Graphalytics: A Big Data Benchmark for Graph-Processing platforms</em> by Mihai Capotă, Tim Hegeman, Alexandru Iosup (Delft University of Technology), Arnau Prat (Universitat Politècnica de Catalunya), Orri Erling (OpenLink Sotware) and Peter Boncz (CWI). We will provide more information about GRADES and this specific presentation in a following post as GRADES is part of the events organized by LDBC.</p> +<p>Don&rsquo;t forget to check our presentations if you&rsquo;re attending the SIGMOD!</p> + + + + + SNB Interactive Part 1: What Is SNB Interactive Really About? + https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/ + Thu, 14 May 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about/ + <p>This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. This is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of same.</p> +<p>With two implementations of SNB interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its performance characteristics are understood and even if these do not represent the maximum of the attainable, there are no glaring mistakes and the implementation represents a reasonable best effort by those who ought to know, namely the system vendors.</p> +<p>The essence of a benchmark is a set of trick questions or choke points, as LDBC calls them. A number of these were planned from the start. It is then the role of experience to tell whether addressing these is really the key to winning the race. Unforeseen ones will also surface.</p> +<p>So far, we see that SNB confronts the implementor with choices in the following areas:</p> +<ul> +<li>Data model: Relational, RF, property graph?</li> +<li>Physical model, e.g. row-wise vs. column wise storage</li> +<li>Materialized data ordering: Sorted projections, composite keys, replicating columns in auxxiliary data structures</li> +<li>Maintaining precomputed, materialized intermediate results, e.g. use of materialized views, triggers</li> +<li>Query optimization: join order/type, interesting physical data orderings, late projection, top k, etc.</li> +<li>Parameters vs. 
literals: Sometimes different parameter values result in different optimal query plans</li>
+<li>Predictable, uniform latency: The measurement rules stipulate the SUT must not fall behind the simulated workload</li>
+<li>Durability: How to make data durable while maintaining steady throughput? Logging vs. checkpointing.</li>
+</ul>
+<p>In the process of making a benchmark implementation, one naturally encounters questions about the validity, reasonability and rationale of the benchmark definition itself. Additionally, even though the benchmark might not directly measure certain aspects of a system, making an implementation will take a system past its usual envelope and highlight some operational aspects.</p>
+<ul>
+<li>Data generation: Generating a mid-size dataset takes time, e.g. 8 hours for 300G. In a cloud situation, keeping the dataset in S3 or similar is necessary; re-generating it every time is not an option.</li>
+<li>Query mix: Are the relative frequencies of the operations reasonable? What bias does this introduce?</li>
+<li>Uniformity of parameters: Due to non-uniform data distributions in the dataset, there is easily a 100x difference between a &lsquo;fast&rsquo; and &lsquo;slow&rsquo; case of a single query template. How long does one need to run to balance these fluctuations?</li>
+<li>Working set: Experience shows that there is a large difference between an almost-warm and a steady-state working set. This can be a factor of 1.5 in throughput.</li>
+<li>Are the latency constraints reasonable? In the present case, a qualifying run must have under 5% of all query executions starting over 1 second late. Each execution is scheduled beforehand and done at the intended time. If the SUT does not keep up, it will have all available threads busy and must finish some work before accepting new work, so some queries will start late. Is this a good criterion for measuring consistency of response time? There are some obvious possibilities of abuse.</li>
+<li>Is the benchmark easy to implement/run? Perfection is open-ended and optimization possibilities are infinite, albeit with diminishing returns. Still, getting started should not be too hard. Since systems will be highly diverse, testing that they in fact do the same thing is important. The SNB validation suite is good for this and, given publicly available reference implementations, the effort of getting started is not unreasonable.</li>
+<li>Since a qualifying run must meet latency constraints while going as fast as possible, setting the performance target involves trial and error. Does the tooling make this easy?</li>
+<li>Is the durability rule reasonable? Right now, one is not required to do checkpoints but must report the time to roll forward from the last checkpoint or initial state. Incenting vendors to build faster recovery is certainly good, but we are not yet through with all the implications.
What about redundant clusters?</li> +</ul> +<p>The following posts will look at the above in light of actual experience.</p> +<h3 id="snb-interactive-series">SNB Interactive Series</h3> +<ul> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-1-what-is-snb-interactive-really-about">SNB Interactive, Part 1: What is SNB Interactive Really About?</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-2-modeling-choices">SNB Interactive, Part 2: Modeling Choices</a></li> +<li><a href="https://ldbcouncil.org/post/snb-interactive-part-3-choke-points-and-initial-run-on-virtuoso/">SNB Interactive, Part 3: Choke Points and Initial Run on Virtuoso</a></li> +</ul> + + + + + Why Do We Need an LDBC SNB-Specific Workload Driver? + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + Tue, 21 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/why-do-we-need-an-ldbc-snb-specific-workload-driver/ + <p>In a previous <a href="https://ldbcouncil.org/tags/driver">3-part blog series</a> we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn&rsquo;t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more traditional database benchmark workloads. Additionally, it will motivate why we chose to develop a new workload driver as part of this work, rather than using existing tooling that was developed in other database benchmarking efforts. To briefly recap, the task of the driver is to run a transactional database benchmark against large synthetic graph datasets - &ldquo;graph&rdquo; is the word that best captures the novelty and difficulty of this work.</p> +<p><strong>Workload Execution - Traditional vs Graph</strong></p> +<p>Transactional graph workloads differ from traditional relational workloads in several fundamental ways, one of them being the complex dependencies that exist between queries of a graph workload.</p> +<p>To understand what is meant by &ldquo;traditional relational workloads&rdquo;, take the classical TPC-C benchmark as an example. In TPC-C Remote Terminal Emulators (emulators) are used to issue update transactions in parallel, where the transactions issued by these emulators do not depend on one another. Note, &ldquo;dependency&rdquo; is used here in the context of scheduling, i.e., one query is dependent on another if it can not start until the other completes. For example, a New-Order transaction does not depend on other orders from this or other users. Naturally, the results of Stock-Level transactions depend on the items that were previously sold, but in TPC-C it is not an emulator&rsquo;s responsibility to enforce any such ordering. The scheduling strategy employed by TPC-C is tailored to the scenario where transactional updates do not depend on one another. In reality, one would expect to also have scheduling dependencies between transactions, e.g., checking the status of the order should only be done after the order is registered in the system. TPC-C, however, does not do this and instead only asks for the status of the last order <em>for a given user</em>. Furthermore, adding such dependencies to TPC-C would make scheduling only slightly more elaborate. 
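</p>
+<p>To make the notion of a scheduling dependency concrete, here is a minimal, hypothetical Python sketch (not the actual LDBC driver code) of a driver that holds an operation back until the operation it depends on has completed:</p>
+<pre><code>import threading
+
+# Toy dependency tracking: an operation may name another operation that must
+# have completed before it is allowed to start, e.g. a status check that
+# depends on the corresponding order having been created first.
+completed = set()
+cond = threading.Condition()
+
+def mark_completed(op_id):
+    with cond:
+        completed.add(op_id)
+        cond.notify_all()
+
+def execute(op_id, depends_on=None):
+    with cond:
+        # Block this driver thread until the prerequisite has completed.
+        while depends_on is not None and depends_on not in completed:
+            cond.wait()
+    print("executing", op_id)  # stand-in for issuing the actual query/update
+    mark_completed(op_id)
+
+# The status check waits for the new-order operation to finish first.
+threading.Thread(target=execute, args=("check_status", "new_order")).start()
+execute("new_order")
+</code></pre>
+<p>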
Indeed, the Load Tester (LT) would need to make sure a New-Order transaction always precedes the read requests that check its status, but because users (and their orders) are partitioned across LTs, and orders belong to a particular user, this scheduling does not require inter-LT communication.</p> +<p>A significantly more difficult scheduling problem arises when we consider the SNB benchmark that models a real-world social network. Its domain includes users that form a social friendship graph and which leave posts/comments/likes on each others walls (forums). The update transactions are generated (exported as a log) by the data generator, with assigned timestamps, e.g. user 123 added post 456 to forum 789 at time T. Suppose we partition this workload by user, such that each driver gets all the updates (friendship requests, posts, comments and likes on other user&rsquo;s posts etc) initiated by a given user. Now, if the benchmark is to resemble a real-world social network, the update operations represent a highly connected (and dependent) network: a user should not create comments before she joins the network, a friendship request can not be sent to a non-existent user, a comment can only be added to a post that already exists, etc. Given a user partitioning scheme, most such dependencies would cross the boundaries between driver threads/processes, because the correct execution of update operations requires that the social network is in a particular state, and that state depends on the progress of other threads/processes.</p> +<p>Such scheduling dependencies in the SNB workload essentially replicate the underlying graph-like shape of its dataset. That is, every time a user comments on a friend&rsquo;s wall, for example, there is a dependency between two operations that is captured by an edge of the social graph. <em>Partitioning the workload among the LTs therefore becomes equivalent to graph partitioning, a known hard problem.</em></p> +<p><strong>Because it&rsquo;s a graph</strong></p> +<p>In short, unlike previous database benchmarking efforts, the SNB workload has necessitated a redefining of the state-of-the-art in workload execution. It is no longer sufficient to rely solely on workload partitioning to safely capture inter-query dependencies in complex database benchmark workloads. The graph-centric nature of SNB introduces new challenges, and novel mechanisms had to be developed to overcome these challenges. To the best of our knowledge, the LDBC SNB Interactive benchmark is the first benchmark that requires a non-trivial partitioning of the workload, among the benchmark drivers. In the context of workload execution, our contribution is therefore the principled design of a driver that executes dependent update operations in a performant and scalable way, across parallel/distributed LTs, while providing repeatable, vendor-independent execution of the benchmark.</p> + + + + + Event Driven Post Generation in Datagen + https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/ + Fri, 10 Apr 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/event-driven-post-generation-in-datagen/ + <p>As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain more in depth how this is actually implemented inside of the generator.</p> +<p>First of all, I start with a few basics of how Datagen works internally. 
In Datagen, once the person graph has been created (persons and their relationships), the activity generation starts. Persons are divided into blocks of 10k, in the same way as during the friendship edge generation process. Then, for each person of the block, three types of forums are created:</p>
+<ul>
+<li>
+<p>The wall of the person</p>
+</li>
+<li>
+<p>The albums of the person</p>
+</li>
+<li>
+<p>The groups where the person is a moderator</p>
+</li>
+</ul>
+<p>We will focus on group generation, but the same concepts apply to the other types of forums. Once a group is created, the members of the group are selected. These are selected from either the friends of the moderator, or random persons within the same block.</p>
+<p>After assigning the members to the group, the post generation starts. We have two types of post generators, the uniform post generator and the event based post generator. Each post generator is responsible for generating, given a forum, a set of posts for the forum, whose authors are taken from the set of members of the forum. The uniform post generator distributes the dates of the generated posts uniformly in the time line (from the date of the membership until the end of the simulation time). On the other hand, the event based post generator assigns dates to posts based on what we call “flashmob events”.</p>
+<p>Flashmob events are generated at the beginning of the execution. Their number is predefined by a configuration parameter, which is set to 30 events per month of simulation, and the time of each event is distributed uniformly along the time line. Also, each event has a volume level assigned (between 1 and 20) following a power law distribution, which determines how relevant or important the event is, and a tag representing the concept or topic of the event. Two different events can have the same tag. For example, one of the flashmob events created for SF1 is related to the &ldquo;Enrique Iglesias&rdquo; tag, has a level of 11, and occurs on the 29th of May 2012 at 09:33:47.</p>
+<p>Once the event based post generation starts for a given group, a subset of the generated flashmob events is extracted. These events must be correlated with the tag/topic of the group, and the set of selected events is restricted by the creation date of the group (in a group one cannot talk about an event previous to the creation of the group). Given this subset of events and their volume levels, a cumulative probability distribution (using the events sorted by event date and their level) is computed, which is later used to determine to which event a given post is associated. Therefore, those events with a larger level will have a larger probability to receive posts, making their volume larger. Then, post generation starts, which can be summarized as follows:</p>
+<ul>
+<li>
+<p>Determine the number of posts to generate</p>
+</li>
+<li>
+<p>Select a random member of the group that will generate the post</p>
+</li>
+<li>
+<p>Determine the event the post will be related to, given the aforementioned cumulative distribution</p>
+</li>
+<li>
+<p>Assign the date of the post based on the event date</p>
+</li>
+</ul>
+<p>In order to assign the date to the post, based on the date of the event the post is assigned to, we follow a probability density which has been extracted from <a href="#references">[1]</a>.
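</p>
+<p>As a rough illustration of the event selection and date assignment steps above, here is a simplified Python sketch (not Datagen&rsquo;s actual code; it assumes a selection probability simply proportional to the event level and a symmetric exponential fall-off in place of the real density, which is described next):</p>
+<pre><code>import bisect
+import random
+
+HOUR_MS = 3600 * 1000  # dates are counted in milliseconds
+
+def pick_event(events):
+    # events: list of (event_date_ms, level), sorted by event date;
+    # an event is chosen with probability proportional to its level.
+    cumulative, total = [], 0
+    for _, level in events:
+        total += level
+        cumulative.append(total)
+    r = random.uniform(0, total)
+    return events[bisect.bisect_left(cumulative, r)]
+
+def post_date(events):
+    # Offset the post date around the chosen event's date; a simple
+    # exponential spread stands in for the density used by Datagen.
+    event_date, _ = pick_event(events)
+    offset = int(random.expovariate(1.0 / (4 * HOUR_MS)))
+    return event_date + random.choice([-1, 1]) * offset
+
+# Roughly the "Enrique Iglesias" example above: level 11, 2012-05-29 09:33:47.
+events = [(1335000000000, 3), (1338284027000, 11)]
+print(post_date(events))
+</code></pre>
+<p>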
The shape of the probability density consists of a combination of an exponential function in the 8 hour interval around the peak, while the volume outside this interval follows a logarithmic function. The following figure shows the actual shape of the volume, centered at the date of the event.</p> +<p><img src="index.png" alt=""></p> +<p>Following the example of &ldquo;Enrique Iglesias&rdquo;, the following figure shows the activity volume of posts around the event as generated by Datagen.</p> +<p><img src="index2.png" alt=""></p> +<p>In this blog entry we have seen how datagen creates event driven user activity. This allows us to reproduce the heterogenous post creation density found in a real social network, where post creation is driven by real world events.</p> +<h4 id="references">References</h4> +<p>[1] Jure Leskovec, Lars Backstrom, Jon M. Kleinberg: Meme-tracking and the dynamics of the news cycle. KDD 2009: 497-506</p> + + + + + Sixth TUC Meeting + https://ldbcouncil.org/event/sixth-tuc-meeting/ + Thu, 19 Mar 2015 13:53:33 -0400 + + https://ldbcouncil.org/event/sixth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce its Sixth Technical User Community (TUC) meeting.</p> +<p>This will be a two-day event at Universitat Politècnica de Catalunya, Barcelona on <strong>Thursday and Friday March 19/20, 2015.</strong></p> +<p>The LDBC FP7 EC funded project is reaching its finalisation, and this will be the last event sponsored directly by the project. However, tasks within LDBC will continue based on the LDBC independent organisation. The event will basically set the following aspects:</p> +<ul> +<li>Two day event with one day devoted to User&rsquo;s experiences and one day devoted to benchmarking experiences.</li> +<li>Presentation of the first benchmarking results for the different benchmarks.</li> +<li>Interaction with the new LDBC Board of Directors and the whole new LDBC organisation officials.</li> +<li>Pre-event with the 3rd Graph-TA workshop organised on March 18th at the same premises, with a lot of interaction and interesting research presentations.</li> +</ul> +<p>We welcome all users of RDF and Graph technologies to attend. If you are interested, please, contact <a href="mailto:damaris@ac.upc.edu">damaris@ac.upc.edu</a>.</p> +<h3 id="agenda">Agenda</h3> +<p><strong>Thursday 19th March</strong></p> +<p>11:00 - 11:30 Registration, coffee break and welcome (Josep Larriba Pey)</p> +<p>11:30 - 12:00 LDBC introduction and status update (Peter Boncz) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981131.pdf">slides</a></p> +<p>12:00 - 13:30 Technology and benchmarking (chair: Peter Boncz)</p> +<p>12:00 Venelin Kotsev (Ontotext). Semantic Publishing Benchmark v2.0. – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981137.pdf">slides</a></p> +<p>12:30 Nina Saveta (FORTH). SPIMBENCH: A Scalable, Schema-Aware, Instance Matching Benchmark for the Semantic Publishing Domain</p> +<p>12:50 Tomer Sagi (HP). 
Titan DB on LDBC SNB Interactive</p> +<p>13:10 Claudio Martella (VUA): Giraph and Lighthouse</p> +<p>13:30 - 14:30 Lunch break</p> +<p>14:30 - 16:00 Applications and use of Graph Technologies (chair: Hassan Chafi)</p> +<p>14:30 Jerven Bolleman (Swiss Institute of Bioinformatics): 20 billion triples in production <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981132.pdf">slides</a></p> +<p>14:50 Mark Wilkinson (Universidad Politécnica de Madrid): Design principles for Linked-Data-native Semantic Web Services <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981133.pdf">slides</a></p> +<p>15:10 Peter Haase (Metaphacts, Systap LLC): Querying the Wikidata Knowledge Graph <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981139.pdf">slides</a></p> +<p>15:30 Esteban Sota (GNOSS): Human Interaction with Faceted Searching Systems for big or complex graphs</p> +<p>18:30 - 20:00 Cultural visit Barcelona city center. Meet at Plaça Catalunya.</p> +<p>20:00 Social dinner at <a href="http://www.bastaix.com">Bastaix Restaurant</a>.</p> +<p><strong>Friday 20th March</strong></p> +<p>9:30 - 11:00 Technology and Benchmarking (chair: Josep L. Larriba-Pey)</p> +<p>9:30 Yinglong Xia (IBM): Towards Temporal Graph Management and Analytics</p> +<p>9:50 Alexandru Iosup (TU Delft). Graphalytics: A big data benchmark for graph-processing platforms</p> +<p>10:10 John Snelson (MarkLogic): Introduction to MarkLogic</p> +<p>10:30 Arnau Prat (UPC-Sparsity Technologies) and Alex Averbuch (Neo): Social Network Benchmark, Interactive Workload</p> +<p>10:50 Moritz Kaufmann. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/moritz-kaufmann-ldbc-snb-benchmark-auditing-6th-ldbc-tuc.pdf">The auditing experience</a></p> +<p>11:15 - 11:45 Coffee break</p> +<p>11:45 - 12:45 Applications and use of Graph Technologies (chair: Atanas Kiryakov)</p> +<p>11:45 Boris Motik (Oxford University): Parallel and Incremental Materialisation of RDF/Datalog in RDFox</p> +<p>12:05 Andreas Both (Unister): E-Commerce and Graph-driven Applications: Experiences and Optimizations while moving to Linked Data</p> +<p>12:25 Smrati Gupta (CA Technologies). Modaclouds Decision Support System in multicloud environments</p> +<p>12:45 Peter Boncz. Conclusions for the LDBC project and future perspectives. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/6881717/6981138.pdf">slides</a></p> +<p>13:30 - 14:30 Lunch break</p> +<p>15:00 LDBC Board of Directors</p> +<h3 id="logistics">Logistics</h3> +<h6 id="date"><strong>Date</strong></h6> +<p>19th and 20th March 2015</p> +<h6 id="venue"><strong>Venue</strong></h6> +<p>The TUC meeting will be held at &ldquo;Aula Master&rdquo; at A3 building located inside the &ldquo;Campus Nord UPC&rdquo; in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h5 id="maps-and-situation"><strong>Maps and situation</strong></h5> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<h5 id="finding-upc"><strong>Finding UPC</strong></h5> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<h5 id="finding-the-meeting-room"><strong>Finding the meeting room</strong></h5> +<h5 id="getting-there">Getting there</h5> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to<br> +the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €20 and trips to other destinations in the city cost approximately €25-30.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. 
You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/sixth-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<h5 id="the-locations-of-the-airport-and-the-city-centre"><strong>The locations of the airport and the city centre</strong></h5> + + + + + The LDBC Datagen Community Structure + https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/ + Sun, 15 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/the-ldbc-datagen-community-structure/ + <p>This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.</p> +<p>When generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other more qualitative characteristics such as the degree distribution, clustering coefficient. Real graphs, and specially social networks, have typically highly skewed degree distributions with a long tail, a moderatelly large clustering coefficient and an appreciable community structure.</p> +<p>The first two characteristics are deliberately modeled in DATAGEN. DATAGEN generates persons with a degree distribution that matches that observed in Facebook, and thanks to the attribute correlated edge generation process, we obtain graphs with a moderately large clustering coefficient. But what about the community structure of graphs generated with DATAGEN? The answer can be found in the paper titled “How community-like is the structure of synthetically generated graphs”, which was published in GRADES 2014 <a href="#references">[1]</a>. Here we summarize the paper and its contributions and findings.</p> +<p>Existing synthetic graph generators such as Rmat <a href="#references">[1]</a> and Mag <a href="#references">[2]</a>, are graphs generators designed to produce graphs with long tailed distributions and large clustering coefficient, but completely ignore the fact that real graphs are structured into communities. For this reason, Lancichinetti et al. proposed LFR <a href="#references">[3]</a>, a graph generator that did not only produced graphs with realistic high level characteristics, but enforced an appreciable community structure. This generator, has become the de facto standard for benchmarking community detection algorithms, as it does not only outputs a graph but also the communities present in that graph, hence it can be used to test the quality of a community detection algorithm.</p> +<p>However, no one studied if the community structure produced by LFR, was in fact realistic compared to real graphs. Even though the community structure in LFR exhibit interesting properties, such as the expected larger internal density than external, or a longtailed distribution of community sizes, they lack the noise and inhomogeneities present in a real graph. And more importantly, how does the community structure of DATAGEN compares to that exhibited in LFR and reap graphs? Is it more or less realistic? The authors of <a href="#references">[1]</a> set up an experiment where they analized the characteristics of the communities output by LFR, and the groups (groups of people interested in a given topic) output by DATAGEN, and compared them to a set of real graphs with metadata. 
These real graphs, which can be downloaded from the Snap project website, have recently become very popular in the field of community detection, as they contain ground truth communities extracted from their metadata. The ground truth graphs used in this experiment are shown in the following table. For more details about how this ground truth is generated, please refer to <a href="#references">[4]</a>.</p>
+<table>
+<thead>
+<tr>
+<th></th>
+<th><em>Nodes</em></th>
+<th><em>Edges</em></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><em>Amazon</em></td>
+<td>334863</td>
+<td>925872</td>
+</tr>
+<tr>
+<td><em>Dblp</em></td>
+<td>317080</td>
+<td>1049866</td>
+</tr>
+<tr>
+<td><em>Youtube</em></td>
+<td>1134890</td>
+<td>2987624</td>
+</tr>
+<tr>
+<td><em>Livejournal</em></td>
+<td>3997962</td>
+<td>34681189</td>
+</tr>
+</tbody>
+</table>
+<p>The authors of <a href="#references">[1]</a> selected a set of statistical indicators to characterize the communities:</p>
+<ul>
+<li>The clustering coefficient</li>
+<li>The triangle participation ratio (TPR), which is the ratio of nodes that close at least one triangle in the community.</li>
+<li>The bridge ratio, which is the ratio of edges whose removal disconnects the community.</li>
+<li>The diameter</li>
+<li>The conductance</li>
+<li>The size</li>
+</ul>
+<p>The authors start by analyzing each community of the ground truth graphs using the above statistical indicators and plotting the distributions of each of them. The following are the plots of the Livejournal graph. We summarize the findings of the authors regarding real graphs:</p>
+<ul>
+<li>Several indicators (Clustering Coefficient, TPR and Bridge ratio) exhibit a multimodal distribution, with two peaks at their extremes.</li>
+<li>Many of the communities (44%) have a small clustering coefficient between 0 and 0.01. Out of them, 56% have just three vertices. On the other hand, 11% of the communities have a clustering coefficient between 0.99 and 1.0. In between, communities exhibit different values of clustering coefficients. This trend is also observed for TPR and Bridge ratio. This suggests that communities cannot be modeled using a single model.
</li>
+<li>84% of the communities have a diameter smaller than five, suggesting that ground truth communities are small and compact.</li>
+<li>Ground truth communities are not very isolated; they have a lot of connections pointing outside of the community.</li>
+<li>Most of the communities are small (10 or fewer nodes).</li>
+<li>In general, ground truth communities are small, with a low diameter, not isolated, and with different ranges of internal connectivity.</li>
+</ul>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index.png" alt=""></td>
+<td style="text-align:center"><img src="index2.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index3.png" alt=""></td>
+<td style="text-align:center"><img src="index4.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index5.png" alt=""></td>
+<td style="text-align:center"><img src="index6.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>The authors performed the same experiment for DATAGEN and LFR graphs. They generated a graph of 150k nodes, using their default parameters. In the case of LFR, they tested five different values of the mixing factor, which specifies the ratio of edges of the community pointing outside of the community. They ranged this value from 0 to 0.5. The following are the distributions for DATAGEN.</p>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index8.png" alt=""></td>
+<td style="text-align:center"><img src="index9.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index10.png" alt=""></td>
+<td style="text-align:center"><img src="index11.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index11.png" alt=""></td>
+<td style="text-align:center"><img src="index12.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>The main conclusions that can be extracted from DATAGEN can be summarized as follows:</p>
+<ul>
+<li>DATAGEN is able to reproduce the multimodal distribution observed for clustering coefficient, TPR and bridge ratio.</li>
+<li>The central part of the clustering coefficient distribution is biased towards the left, in a similar way as observed for the Youtube and Livejournal graphs.</li>
+<li>Communities of DATAGEN graphs are, as in real graphs, not isolated, but in this case their level of isolation is significantly larger.</li>
+<li>The diameter is small, like in the real graphs.</li>
+<li>It is significant that communities in DATAGEN graphs are closer to those observed in Youtube and Livejournal, as these are social networks like the graphs produced by DATAGEN.
We see that DATAGEN is able to reproduce many of their characteristics.</li>
+</ul>
+<p>Finally, the authors repeat the same experiment for the LFR graphs. The following are the plots for the LFR graph with mixing ratio 0.3. From them, the authors extract the following conclusions:</p>
+<ul>
+<li>LFR graphs do not show the multimodal distribution observed in real graphs.</li>
+<li>Only the diameter shows a similar shape as in the ground truth.</li>
+</ul>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index13.png" alt=""></td>
+<td style="text-align:center"><img src="index14.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index15.png" alt=""></td>
+<td style="text-align:center"><img src="index16.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index17.png" alt=""></td>
+<td style="text-align:center"><img src="index18.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>To better quantify how similar the distributions of the different graphs are, the authors also show the correlograms for each of the statistical indicators. These correlograms contain Spearman&rsquo;s correlation coefficient between each pair of graphs for a given statistical indicator. The bluer the color, the stronger the correlation. We see that the DATAGEN distributions correlate very well with those observed in real graphs, especially, as we commented above, with Youtube and Livejournal. On the other hand, LFR only succeeds significantly in the case of the diameter.</p>
+<table>
+<thead>
+<tr>
+<th style="text-align:center"></th>
+<th style="text-align:center"></th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td style="text-align:center"><img src="index19.png" alt=""></td>
+<td style="text-align:center"><img src="index20.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Clustering Coefficient</td>
+<td style="text-align:center">TPR</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index21.png" alt=""></td>
+<td style="text-align:center"><img src="index22.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Bridge Ratio</td>
+<td style="text-align:center">Diameter</td>
+</tr>
+<tr>
+<td style="text-align:center"><img src="index23.png" alt=""></td>
+<td style="text-align:center"><img src="index24.png" alt=""></td>
+</tr>
+<tr>
+<td style="text-align:center">Conductance</td>
+<td style="text-align:center">Size</td>
+</tr>
+</tbody>
+</table>
+<p>We see that DATAGEN is able to reproduce a realistic community structure, compared to existing graph generators. This feature could potentially be exploited to define new benchmarks to measure the quality of novel community detection algorithms. Stay tuned for future blog posts about this topic!</p>
+<h4 id="references">References</h4>
+<p>[1] Arnau Prat-Pérez, <a href="http://dblp.uni-trier.de/pers/hd/d/Dom=iacute=nguez=Sal:David">David Domínguez-Sal</a>: How community-like is the structure of synthetically generated graphs?
<a href="http://dblp.uni-trier.de/db/conf/sigmod/grades2014.html#PratD14">GRADES 2014</a></p> +<p>[2] Deepayan Chakrabarti, Yiping Zhan, and ChristosFaloutsos. R-mat: A recursive model for graph mining. SIAM 2014</p> +<p>[3] Myunghwan Kim and Jure Leskovec. Multiplicative attribute graph model of real-world networks. Internet Mathematics</p> +<p>[4] Andrea Lancichinetti, Santo Fortunato, and Filippo Radicchi. Benchmark graphs for testing community detection algorithms. Physical Review E 2008.</p> + + + + + Industry Relevance of the Semantic Publishing Benchmark + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + Tue, 03 Mar 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/industry-relevance-of-the-semantic-publishing-benchmark/ + <h3 id="publishing-and-media-businesses-are-going-through-transformation">Publishing and media businesses are going through transformation</h3> +<p>I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and wrestling my jetlag in front of Hilton. In the lobby inside the SemTech 2010 conference attendants were watching a game from the FIFA World Cup in South Africa. In the picture, the self-service newspaper stand is empty, except for one free paper. It was not long ago, in the year 2000, this stand was full. Back than the people in the Bay area were willing to pay for printed newspapers. But this is no longer true.</p> +<p>What’s driving this change in publishing and media?</p> +<ul> +<li> +<p>Widespread and instantaneous distribution of information over the Internet has turned news into somewhat of a &ldquo;commodity&rdquo; and few people are willing to pay for it</p> +</li> +<li> +<p>The wealth of free content on YouTube and similar services spoiled the comfort of many mainstream broadcasters;</p> +</li> +<li> +<p>Open access publishing has limited academic publishers to sell journals and books at prices that were considered fair ten years ago.</p> +</li> +</ul> +<p><em>Alongside other changes in the industry, publishers figured out that it is critical to add value through better authoring, promotion, discoverability, delivery and presentation of precious content.</em></p> +<h3 id="imagine-instant-news-in-context-imagine-personal-channels-imagine--triplestores">Imagine instant news in context, Imagine personal channels, Imagine &hellip; triplestores</h3> +<p>While plain news can be created repeatedly, premium content and services are not as easy to create. Think of an article that not only tells the new facts, but refers back to previous events and is complemented by an info-box of relevant facts. It allows one to interpret and comprehend news more effectively. This is the well-known journalistic aim to put news in context. It is also well-known that producing such news in &ldquo;near real time&rdquo; is difficult and expensive using legacy processes and content management technology.</p> +<p>Another example would be a news feed that delivers good coverage of information relevant to a narrow subject – for example a company, a story line or a region. Judging by the demand for intelligent press clipping services like <a href="http://new.dowjones.com/products/factiva/">Factiva</a>, such channels are in demand but are not straightforward to produce with today’s technology. 
Despite the common perception that automated recommendations for related content and personalized news are technology no-brainers, suggesting truly relevant content is far from trivial.</p> +<p>Finally, if we use an example in life sciences, the ability to quickly find scientific articles discussing asthma and x-rays, while searching for respiration disorders and radiation, requires a search service that is not easy to deliver.</p> +<p>Many publishers have been pressed to advance their business. This, in turn, had led to quest to innovate. And semantic technology can help publishers in two fundamental ways:</p> +<ol> +<li>Generation of rich and &ldquo;meaningful&rdquo; (trying not to use &ldquo;semantic&rdquo; :-) metadata descriptions; 1. Dynamic retrieval of content, based on this rich metadata, enabling better delivery.</li> +</ol> +<p>In this post I write about &ldquo;semantic annotation&rdquo; and how it enables application scenarios like BBC’s Dynamic Semantic Publishing (DSP). I will also present the business case behind DSP. The final part of the post is about triplestores – semantic graph database engines, used in DSP. To be more concrete I write about the Semantic Publishing Benchmark (SPB), which evaluates the performance of triplestores in DSP scenarios.</p> +<h3 id="semantic-annotation-produces-rich-metadata-descriptions--the-fuel-for-semantic-publishing">Semantic Annotation produces Rich Metadata Descriptions – the fuel for semantic publishing</h3> +<p>The most popular meaning of &ldquo;semantic annotation&rdquo; is the process of enrichment of text with links to (descriptions of) concepts and entities mentioned in the text. This usually means tagging either the entire document or specific parts of it with identifiers of entities. These identifiers allow one to retrieve descriptions of the entities and relations to other entities – additional structured information that fuels better search and presentation.</p> +<p><img src="02_semantic_repository.png" alt=""></p> +<p>The concept of using <a href="http://infosys3.elfak.ni.ac.rs/nastava/attach/SemantickiWebKurs/sdarticle.pdf">text-mining for automatic semantic annotation</a> of text with respect to very large datasets, such as <a href="http://dbpedia.org/">DBPedia</a>, emerged in early 2000. In practical terms it means using such large datasets as a sort of gigantic gazetteer (name lookup tool) and the ability to disambiguate. Figuring out whether &ldquo;Paris&rdquo; in the text refers to the capital of France or to Paris, Texas, or to Paris Hilton is crucial in such context. Sometimes this is massively difficult – try to instruct a computer how to guess whether &ldquo;Hilton&rdquo; in the second sentence of this post refers to a hotel from the chain founded by her grandfather or that I had the chance to meet Paris Hilton in person on the street in San Francisco.</p> +<p>Today there are plenty of tools (such as the <a href="https://www.ontotext.com/semantic-solutions/media-publishing/">Ontotext Media and Publishing</a> platform and <a href="https://github.com/dbpedia-spotlight/dbpedia-spotlight/wiki">DBPedia Spotlight</a>) and services (such as Thomson Reuter’s <a href="http://www.opencalais.com/">OpenCalais</a> and Ontotext’s <a href="http://s4.ontotext.com">S4</a>) that offer automatic semantic annotation. Although text-mining cannot deliver 100% correct annotations, there are plenty of scenarios, where technology like this would revoluntionize a business. 
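+</p>
+<p>To make this concrete, the following is a minimal sketch (using the rdflib Python library) of what such annotation metadata might look like once it is stored as RDF. The article IRI and the <code>example.org</code> properties are invented for illustration; real annotation services use their own vocabularies.</p>
+<pre tabindex="0"><code># Minimal sketch of semantic annotation metadata, built with rdflib.
+# The article IRI and the example.org properties are hypothetical.
+from rdflib import Graph, Literal, Namespace, URIRef
+
+EX  = Namespace("http://example.org/annotation/")
+DBR = Namespace("http://dbpedia.org/resource/")
+
+g = Graph()
+article = URIRef("http://example.org/articles/42")
+
+# The text-mining step has decided that "Paris" in this article means the
+# French capital, not Paris, Texas, and not Paris Hilton.
+g.add((article, EX.mentions, DBR["Paris"]))
+g.add((article, EX.mentions, DBR["2010_FIFA_World_Cup"]))
+g.add((article, EX.annotationConfidence, Literal(0.87)))
+
+print(g.serialize(format="turtle"))
+</code></pre>
+<p>Once identifiers like these are attached to a piece of content, retrieving &ldquo;everything we have about Paris&rdquo; becomes a metadata lookup rather than a full-text guess.</p>
+<p>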
This is the case with the Dynamic Semantic Publishing scenario described below.</p> +<h3 id="the-bbcs-dynamic-semantic-publishing-dsp">The BBC’s Dynamic Semantic Publishing (DSP)</h3> +<p>Dynamic Semantic Publishing is a model for using semantic technology in media developed by a group led by John O’Donovan and Jem Rayfield at the BBC. The implementation of DSP behind BBC’s FIFA World Cup 2010 website was the first high-profile success story for usage of semantic technology in media. It is also the basis for the SPB benchmark – sufficient reasons to introduce this use case at length below.</p> +<p>BBC Future Media &amp; Technology department have transformed the BBC relational content management model and static publishing framework to a fully dynamic semantic publishing architecture. With minimal journalistic management, media assets are being enriched with links to concepts, semantically described in a triplestore. This novel semantic approach provides improved navigation, content re-use and re-purposing through automatic aggregation and rendering of links to relevant stories. At the end of the day DSP improves the user experience on BBC’s web site.</p> +<p><em>&ldquo;A high-performance dynamic semantic publishing framework facilitates the publication of automated metadata-driven web pages that are light-touch, requiring minimal journalistic management, as they automatically aggregate and render links to relevant stories&rdquo;.</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">Jem Rayfield, Senior Technical Architect</a>, BBC News and Knowledge</p> +<p>The Dynamic Semantic Publishing (DSP) architecture of the BBC curates and publishes content (e.g. articles or images) based on embedded Linked Data identifiers, ontologies and associated inference. It allows for journalists to determine levels of automation (&ldquo;edited by exception&rdquo;) and support semantic advertisement placement for audiences outside of the UK. The following quote explains the workflow when a new article gets into BBC’s content management system.</p> +<p><em>&ldquo;In addition to the manual selective tagging process, journalist-authored content is automatically analysed against the World Cup ontology. A <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#language">natural language and ontological determiner process</a> automatically extracts World Cup concepts embedded within a textual representation of a story. The concepts are moderated and, again, selectively applied before publication. Moderated, automated concept analysis improves the depth, breadth and quality of metadata publishing.</em></p> +<p><img src="03_bbc_sport.png" alt=""></p> +<p><em>Journalist-published metadata is captured and made persistent for querying using the resource description framework (<a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#RDF"><em>RDF</em></a>) metadata representation and triple store technology. <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#BigOWLIM">A RDF triplestore</a> and <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html#SPARQL">SPARQL</a> approach was chosen over and above traditional relational database technologies due to the requirements for interpretation of metadata with respect to an ontological domain model. 
The high level goal is that the domain ontology allows for intelligent mapping of journalist assets to concepts and queries. The chosen triplestore provides reasoning following the forward-chaining model and thus implied inferred statements are automatically derived from the explicitly applied journalist metadata concepts. For example, if a journalist selects and applies the single concept &ldquo;Frank Lampard&rdquo;, then the framework infers and applies concepts such as &ldquo;England Squad&rdquo;, &ldquo;Group C&rdquo; and &ldquo;FIFA World Cup 2010&rdquo; &hellip;&rdquo;</em> &ndash; Jem Rayfield</p> +<p>One can consider each of the &ldquo;aggregation pages&rdquo; of BBC as a sort of feed or channel serving content related to a specific topic. If you take this perspective, with its World Cup 2010 website BBC was able to provide more than 700 thematic channels.</p> +<p><em>&ldquo;The World Cup site is a large site with over 700 aggregation pages (called index pages) designed to lead you on to the thousands of story pages and content</em></p> +<p><strong>…</strong><strong><em>we are not publishing pages, but publishing content</em></strong> <em>as assets which are then organized by the metadata dynamically into pages, but could be re-organized into any format we want much more easily than we could before.</em></p> +<p><img src="04_content_tagging.png" alt=""></p> +<p><em>… The index pages are published automatically. This process is what assures us of the highest quality output, but still <strong>save large amounts of time</strong> in managing the site and <strong>makes it possible for us to efficiently run so many pages</strong> for the World Cup.&rdquo;</em> &ndash; <a href="http://www.bbc.co.uk/blogs/bbcinternet/2010/07/the_world_cup_and_a_call_to_ac.html">John O&rsquo;Donovan, Chief Technical Architect, BBC Future Media &amp; Technology</a></p> +<p>To get a real feeling about the load of the triplestore behind BBC&rsquo;s World Cup web site, here are some statistics:</p> +<ul> +<li> +<p>800+ aggregation pages (Player, Team, Group, etc.), generated through SPARQL queries;</p> +</li> +<li> +<p>Average unique page requests/day: 2 million;</p> +</li> +<li> +<p>Average <strong>SPARQL queries/day: 1 million;</strong></p> +</li> +<li> +<p><strong>100s repository updates/inserts per minute</strong> with OWL 2 RL reasoning;</p> +</li> +<li> +<p>Multi data center that is fully resilient, clustered 6 node triplestore.</p> +</li> +</ul> +<h3 id="the-semantic-publishing-benchmark">The Semantic Publishing Benchmark</h3> +<p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the BBC Dynamic Semantic Publishing scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volumes of read requests (SPARQL queries collecting recent content and data to generate web pages on a specific subject, e.g. Frank Lampard).</p> +<p>SPB simulates a setup for media that deals with large volumes of streaming content, e.g. articles, pictures, videos. This content is being enriched with metadata that describes it through links to reference knowledge:</p> +<ul> +<li> +<p><em>Reference knowledge:</em> taxonomies and databases that include relevant concepts, entities and factual information (e.g. 
sport statistics);</p> +</li> +<li> +<p><em>Metadata</em> for each individual piece of content allows publishers to efficiently produce live streams of content relevant to specific subjects.</p> +</li> +</ul> +<p>In this scenario the triplestore holds both reference knowledge and metadata. The main interactions with the repository are of two types:</p> +<ul> +<li> +<p><em>Aggregation queries</em> retrieve content according to various criteria. There are two sets (mixes) of aggregation queries. The basic one includes interactive queries that involve retrieval of concrete pieces of content, as well as aggregation functions, geo-spatial and full-text search constraints. The analytical query mix includes analytical queries, faceted search and drill-down queries;</p> +</li> +<li> +<p><em>Updates</em>, adding new metadata or updating the reference knowledge. It is important that such updates should immediately impact the results of the aggregation queries. Imagine a fan checking the page for Frank Lampard right after he scored a goal – she will be very disappointed to see out of date statistics there.</p> +</li> +</ul> +<p>SPB v.1.0 directly reproduces the DSP setup at the BBC. The reference dataset consists of BBC Ontologies (Core, Sport, News), BBC datasets (list of F1 teams, MPs, etc.) and an excerpt from <a href="http://www.geonames.org/">Geonames</a> for the UK. The benchmark is packed with metadata generator that allows one to set up experiments at different scales. The metadata generator produces 19 statements per Creative Work (BBC’s slang for all sorts of media assets). The standard scale factor is 50 million statements.</p> +<p>A more technical introduction to SPB can be found in this <a href="https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark">post</a>. Results from experiments with SPB on different hardware configurations, including AWS instances, are available in this <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">post</a>. An interesting discovery is that given the current state of the technology (particularly the GraphDB v.6.1 engine) and today’s cloud infrastructure, the load of BBC’s World Cup 2010 website can be handled at AWS by a cluster that costs only $81/day.</p> +<p>Despite the fact that SPB v.1.0 follows closely the usage scenario for triplestores in BBC’s DSP incarnations, it is relevant to a wide range of media and publishing scenarios, where large volumes of &ldquo;fast flowing&rdquo; content need to be &ldquo;dispatched&rdquo; to serve various information needs of a huge number of consumers. The main challenges can be summarized as follows:</p> +<ul> +<li> +<p>The Triplestore is used as operational database serving a massive number of read queries (hundreds of queries per second) in parallel with tens of update transactions per second. Transactions need to be handled instantly and in a reliable and consistent manner;</p> +</li> +<li> +<p>Reasoning is needed to map content descriptions to queries in a flexible manner;</p> +</li> +<li> +<p>There are specific requirements, such as efficient handling of full-text search, geo-spatial and temporal constraints.</p> +</li> +</ul> +<h3 id="spb-v20--steeper-for-the-engines-closer-to-the-publishers">SPB v.2.0 – steeper for the engines, closer to the publishers</h3> +<p>We are in the final testing of the new version 2.0 of SPB. 
The benchmark has evolved to allow for retrieval of semantically relevant content in a more advanced manner and at the same time to demonstrate how triplestores can offer simplified and more efficient querying.</p> +<p>The major changes in SPB v.2.0 can be summarized as follows:</p> +<ul> +<li> +<p>Much bigger reference dataset: from 170 thousand to 22 million statements. Now it includes GeoNames data about all of Europe (around 7 million statements) and DBPedia data about companies, people and events (14 million statements). This way we can simulate media archives described against datasets with good global coverage for specific types of objects. Such large reference sets also provide a better testing ground for experiments with very large content archives – think of 50 million documents (1 billion statements) or more;</p> +</li> +<li> +<p>Better interconnected reference data: more than 5 million links between entities, including 500,000 owl:sameAs links between DBPedia and Geonames descriptions. The latter evaluates the capabilities of the engine to deal with data coming from multiple sources, which use different identifiers for one and the same entity;</p> +</li> +<li> +<p>Retrieval of relevant content through links in the reference data, including inferred ones. To this end it is important than SPB v.2.0 involves much more comprehensive inference, particularly with respect to transitive closure of parent-company and geographic nesting chains.</p> +</li> +</ul> + + + + + OWL-Empowered SPARQL Query Optimization + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + Wed, 18 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/owl-empowered-sparql-query-optimization/ + <p>The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution plans for a given query.</p> +<p>In this post, we propose a different approach to query optimization, which is meant to complement (rather than replace) the standard optimization methodologies for SPARQL queries. Our approach is based on the use of schema information, encoded using OWL constructs, which often accompany Linked Data.</p> +<p>OWL adopts the Open World Assumption and hence OWL axioms are perceived primarily to infer new knowledge. Nevertheless, ontology designers consider OWL as an expressive schema language used to express constraints for validating the datasets, hence following the Closed World Assumption when interpreting OWL ontologies. Such constraints include disjointness/equivalence of classes/properties, cardinality constraints, domain and range restrictions for properties and others.</p> +<p>This richness of information carried over by OWL axioms can be the basis for the development of schema-aware techniques that will allow significant improvements in the performance of existing RDF query engines when used in tandem with data statistics or even other heuristics based on patterns found in SPARQL queries. 
As a simple example, a cardinality constraint at the schema level can provide a hint on the proper join ordering, even if data statistics are missing or incomplete.</p> +<p>The aim of this post is to show that the richness of information carried over by OWL axioms under the Close World Assumption can be the basis for the development of schema-aware optimization techniques that will allow considerable improvement for query processing. To attain this objective, we discuss a small set of interesting cases of OWL axioms; a full list can be found <a href="LDBC_D4.4.2_final.pdf">here</a>.</p> +<h3 id="schema-based-optimization-techniques">Schema-Based Optimization Techniques</h3> +<p>Here we provide some examples of queries, which, when combined with specific schema constraints expressed in OWL, can help the optimizer in formulating the (near to) optimal query plans.</p> +<p>A simple first case is the case of constraint violation. Consider the query below, which returns all instances of class <code>&lt;A&gt;</code> which are fillers of a specific property <code>&lt;P&gt;</code>. If the underlying schema contains the information that the range of <code>&lt;P&gt;</code> is class <code>&lt;B&gt;</code>, and that class <code>&lt;B&gt;</code> is disjoint from class <code>&lt;A&gt;</code>, then this query should return the empty result, with no further evaluation (assuming that the constraints associated with the schema are satisfied by the data). An optimizer that takes into account schema information should return an empty result in constant time instead of trying to optimize or evaluate the large star join.</p> +<pre tabindex="0"><code>SELECT ?v +WHERE { ?v rdf : type &lt;A&gt; . + ?u &lt;P&gt; ?v . ?u &lt;P&gt; ?v1 . + ?u &lt;P1 &gt; ?v2 . ?u &lt;P2 &gt; ?v3 . + ?u &lt;P3 &gt; ?v4 . ?u &lt;P4 &gt; ?v5} +</code></pre><p>Schema-aware optimizers could also prune the search space by eliminating results that are known a priori not to be in the answer set of a query. The query above is an extreme such example (where all potential results are pruned), but other cases are possible, such as the case of the query below, where all subclasses of class <code>&lt;A1&gt;</code> can immediately be identified as not being in the answer set.</p> +<pre tabindex="0"><code>SELECT ?c +WHERE { ?x rdf: type ?c . ?x &lt;P&gt; ?y . + FILTER NOT EXISTS \{ ?x rdf: type &lt;A1 &gt; }} +</code></pre><p>Another category of schema-empowered optimizations has to do with improved selectivity estimation. In this respect, knowledge about the cardinality (minimum cardinality, maximum cardinality, exact cardinality, functionality) of a property can be exploited to formulate better query plans, even if data statistics are incomplete, missing or erroneous.</p> +<p>Similarly, taking into account class hierarchies, or the definition of classes/properties via set theoretic constructs (union, intersection) at the schema level, can provide valuable information on the selectivity of certain triple patterns, thus facilitating the process of query optimization. Similar effects can be achieved using information about properties (functionality, transitivity, symmetry etc).</p> +<p>As an example of these patterns, consider the query below, where class <code>&lt;C&gt;</code> is defined as the intersection of classes <code>&lt;C1&gt;</code>,<code> &lt;C2&gt;</code>. 
Thus, the triple pattern <code>(?x rdf:type &lt;C&gt;)</code> is more selective than <code>(?y rdf:type &lt;C1&gt;)</code> and <code>(?z rdf:type &lt;C2&gt;)</code> and this should be immediately recognizable by the optimizer, without having to resort to cost estimations. This example shows also how unnecessary triple patterns can be pruned from a query to reduce the number of necessary joins. Figure 1 illustrates the query plan obtained when the OWL intersectionOf construct is used.</p> +<pre tabindex="0"><code>SELECT ?x +WHERE { ?x rdf: type &lt;C&gt; . ?x &lt;P1 &gt; ?y . + ?y rdf : type &lt;C1 &gt; . ?y &lt;P2 &gt; ?z . ?z rdf : type &lt;C2 &gt; } +</code></pre><p><img src="owl_constraints.png" alt="image"></p> +<p>Schema information can also be used by the query optimizer to rewrite SPARQL queries to equivalent ones that are found in a form for which already known optimization techniques are easily applicable. For example, the query below could easily be transformed into a classical star-join query if we know (from the schema) that property <code>P4</code> is a symmetric property.</p> +<pre tabindex="0"><code>SELECT ?y ?y1 ?y2 ?y3 +WHERE { ?x &lt;P1 &gt; ?y . ?x &lt;P2 &gt; ?y1 . + ?x &lt;P3 &gt; ?y2 . ?y3 &lt;P4 &gt; ?x } +</code></pre><h3 id="conclusion">Conclusion</h3> +<p>In this post we argued that OWL-empowered optimization techniques can be beneficial for SPARQL query optimization when used in tandem with standard heuristics based on statistics. We provided some examples which showed the power of such optimizations in various cases, namely:</p> +<ul> +<li>Cases where the search space can be pruned due to the schema and the associated constraints; an extreme special sub-case is the identification of queries that violate schema constraints and thus produce no results.</li> +<li>Cases where the schema can help in the estimation of triple pattern selectivity, even if statistics are incomplete or missing.</li> +<li>Cases where the schema can identify redundant triple patterns that do not affect the result and can be safely eliminated from the query.</li> +<li>Cases where the schema can be used for rewriting a query in an equivalent form that would facilitate optimization using well-known optimization techniques.</li> +</ul> +<p>This list is by no means complete, as further cases can be identified by optimizers. Our aim in this post was not to provide a complete listing, but to demonstrate the potential of the idea in various directions.</p> + + + + + Person Activity Subgraph Features in LDBC DATAGEN + https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/ + Wed, 04 Feb 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/person-activity-subgraph-features-in-ldbc-datagen/ + <p>When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically borrowed by the friendship subgraph and/or its structure. However, a social graph is more than a bunch of people being connected by friendship relations, but has a lot more of other things is worth to look at. With a quick view to commercial social networks like Facebook, Twitter or Google+, one can easily identify a lot of other elements such as text images or even video assets. More importantly, all these elements form other subgraphs within the social network! 
For example, the person activity subgraph is composed of posts and their replies in the different forums/groups of a social network, and has a tree-like structure connecting people through their message interactions.</p>
+<p>When looking at the LDBC Social Network Benchmark (SNB) and its interactive workload, one realizes that these other subgraphs, and especially the person activity subgraph, play a role even more important than that played by the friendship subgraph. Just two numbers illustrate this importance: 11 out of the 14 interactive workload queries need to traverse parts of the person activity subgraph, and about 80% of all the data generated by DATAGEN belongs to this subgraph. As a consequence, a lot of effort has been devoted to making sure that the person activity subgraph is realistic enough to fulfill the needs of the benchmark. In the rest of this post, I will discuss some of the features implemented in DATAGEN that make the person activity subgraph interesting.</p>
+<h3 id="reaslistic-message-content">Realistic Message Content</h3>
+<p>Messages&rsquo; content in DATAGEN is not random, but contains snippets of text extracted from Dbpedia talking about the tags the message has. Furthermore, not all messages are the same size, depending on whether they are posts or replies to them. For example, the size of a post is selected uniformly between a minimum and a maximum, but there is also a small probability that the content is very large (about 2000 characters). In the case of comments (replies to posts), there is a probability of 0.66 that they are very short (“ok”, “good”, “cool”, “thanks”, etc.). Moreover, in real forum conversations, it is typical to see conversations evolving from one topic to another. For this reason, there is a probability that the tags of the comments replying to a post change during the flow of the conversation, moving from the post&rsquo;s tags to other related or randomly selected tags.</p>
+<h3 id="non-uniform-activity-levels">Non-uniform activity levels</h3>
+<p>In a real social network, not all the members show the same level of activity. Some people post messages more sporadically than others, whose activity is significantly higher. DATAGEN reproduces this phenomenon by correlating the activity level with the number of friends a person has. That is, the more friends a person has, the larger the number of posts they create, and also, the larger the number of groups they belong to.</p>
+<h3 id="time-correlated-post-and-comment-generation">Time-correlated post and comment generation</h3>
+<p>In a real social network, user activity is driven by real world events such as sports events, elections or natural disasters, just to cite a few. For this reason, we observe spikes of activity around these events, where the amount of messages created increases significantly during a short period of time, reaching a maximum and then decreasing. DATAGEN emulates this behavior by generating a set of real world events about specific tags. Then, when the dates of posts and comments are generated, these events are taken into account in such a way that posts and comments are clustered around them. Also, not all events are equally relevant, so some spikes are larger than others. The shape of the activity is modeled following the model described in <a href="#references">[1]</a>. Furthermore, in order to represent the more regular and uniform person activity, we also generate uniformly distributed messages along the time line.
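+</p>
+<p>The interplay between event-driven spikes and the uniform background can be illustrated with a small sketch. This is a toy model only, not DATAGEN&rsquo;s actual implementation; the event dates, the decay rate and the 70/30 split are invented for the example.</p>
+<pre tabindex="0"><code># Toy sketch: message timestamps as a mix of uniform background activity and
+# bursts that decay after each real-world event. Not DATAGEN's actual code.
+import random
+
+START, END = 0.0, 365.0          # simulation time, in days
+EVENTS = [60.0, 180.0, 300.0]    # hypothetical event dates
+
+def sample_message_time():
+    if random.random() &lt; 0.3:                 # uniform background activity
+        return random.uniform(START, END)
+    event = random.choice(EVENTS)             # burst around a random event
+    return min(END, event + random.expovariate(1.0))   # decays after the event
+
+timestamps = sorted(sample_message_time() for _ in range(100000))
+</code></pre>
+<p>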
The following figure shows the user activity volume along the time line.</p> +<p><img src="1.png" alt="image"></p> +<p>As we see, the timeline contains spikes of activity, instead of being uniform. Note that the generally increasing volume activity is due to the fact that more people is added to the social network as time advances.</p> +<p>In this post we have reviewed several interesting characteristics of the person activity generation process in DATAGEN. Stay tuned for future blog posts about this topic.</p> +<h4 id="references">References</h4> +<p>[1] Leskovec, J., Backstrom, L., &amp; Kleinberg, J. (2009, June). Meme-tracking and the dynamics of the news cycle. In <em>Proceedings of the 15th ACM SIGKDD international conference on Knowledge discovery and data mining</em> (pp. 497-506). ACM.</p> + + + + + SNB Driver - Part 2: Tracking Dependencies Between Queries + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + Fri, 23 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries/ + <p>The <a href="https://ldbcouncil.org/post/snb-driver-part-1">SNB Driver part 1</a> post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we&rsquo;ll drill down deeper into the details of what it means to execute &ldquo;dependent queries&rdquo; during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in detail, it is just there to serve as a point of reference.</p> +<h3 id="definitions">Definitions</h3> +<ul> +<li> +<p><em>Simulation Time (ST)</em>: notion of time created by data generator. All time stamps in the generated data set are in simulation time</p> +</li> +<li> +<p><em>Real Time (RT)</em>: wall clock time</p> +</li> +<li> +<p><em>Time Compression Ratio</em>: function that maps simulation time to real time, e.g., an offset in combination with a compression ratio. It is a static value, set in driver configuration. Real Time Ratio is reported along with benchmark results, allowing others to recreate the same benchmark</p> +</li> +<li> +<p><em>Operation</em>: read and/or write</p> +</li> +<li> +<p><em>Dependencies</em>: operations in this set introduce dependencies in the workload. That is, for every operation in this set there exists at least one other operation (in Dependents) that can not be executed until this operation has been processed</p> +</li> +<li> +<p><em>Dependents</em>: operations in this set are dependent on at least one other operation (in Dependencies) in the workload</p> +</li> +<li> +<p><em>Due Time (DueT)</em>: point in simulation time at which the execution of an operation should be initiated.</p> +</li> +<li> +<p><em>Dependent Time (DepT)</em>: in addition to Due Time, every operation in Dependents also has a Dependent Time, which corresponds to the Due Time of the operation that it depends on. Dependent Time is always before Due Time. 
For operations with multiple dependencies Dependent Time is the maximum Due Time of all the operations it depends on.</p> +</li> +<li> +<p><em>Safe Time (SafeT)</em>: time duration.</p> +<ul> +<li> +<p>when two operations have a necessary order in time (i.e., dependency) there is at least a SafeT interval between them</p> +</li> +<li> +<p>SafeT is the minimum duration between the Dependency Time and Due Time of any operations in Dependents</p> +</li> +</ul> +</li> +<li> +<p>​<em>Operation Stream</em>: sequence of operations ordered by Due Time (dependent operations must separated by at least SafeT)</p> +</li> +<li> +<p><em>Initiated Operations</em>: operations that have started executing but not yet finished</p> +</li> +<li> +<p><em>Local Completion Time (per driver)</em>: point in simulation time behind which there are no uncompleted operationsLocal Completion Time = min(min(Initiated Operations), max(Completed Operations))</p> +</li> +<li> +<p><em>Global Completion Time (GCT)</em>: minimum completion time of all drivers. Once GCT has advanced to the Dependent Time of some operation that operation is safe to execute, i.e., the operations it depends on have all completed executing. Global Completion Time = min(Local Completion Time)​</p> +</li> +<li> +<p><em>Execution Window (Window)</em>: a timespan within which all operations can be safely executed</p> +<ul> +<li> +<p>All operations satisfying window.startTime &lt;= operation.DueT &lt; window.endTime may be executed</p> +</li> +<li> +<p>Within a window no restrictions on operation ordering or operation execution time are enforced, driver has a freedom of choosing an arbitrary scheduling strategy inside the window</p> +</li> +<li> +<p>To ensure that execution order respects dependencies between operations, window size is bounded by SafeT, such that: 0 &lt; window.duration &lt;= SafeT</p> +</li> +<li> +<p>Window duration is fixed, per operation stream; this is to simplify scheduling and make benchmark runs repeatable</p> +</li> +<li> +<p>Before any operations within a window can start executing it is required that: GCT &gt;= window.startTime - (SafeT - window.duration)</p> +</li> +<li> +<p>All operations within a window must initiate and complete between window start and end times: window.startTime &lt;= operation.initiate &lt; window.endTime and window.startTime &lt;= operation.complete &lt; window.endTime</p> +</li> +</ul> +</li> +<li> +<p><em>Dependency Mode</em>: defines dependencies, constraints on operation execution order</p> +</li> +<li> +<p><em>Execution Mode</em>: defines how the runtime should execute operations of a given type</p> +</li> +</ul> +<h3 id="tracking-dependencies">Tracking Dependencies</h3> +<p>Now, the fun part, making sure dependent operations are executed in the correct order.</p> +<p>Consider that every operation in a workload belongs to none, one, or both of the following sets: Dependencies and Dependents. As mentioned, the driver uses operation time stamps (Due Times) to ensure that dependencies are maintained. It keeps track of the latest point in time behind which every operation has completed. That is, every operation (i.e., dependency) with a Due Time lower or equal to this time is guaranteed to have completed execution. 
It does this by maintaining a monotonically increasing variable called Global Completion Time (GCT).</p> +<p>Logically, every time the driver (via a database connector) begins execution of an operation from Dependencies that operation is added to Initiated Operations:</p> +<ul> +<li>the set of operations that have started executing but not yet finished.</li> +</ul> +<p>Then, upon completion, the operation is removed from Initiated Operations and added to Completed Operations:</p> +<ul> +<li>the set of operations that have started and finished executing.</li> +</ul> +<p>Using these sets, each driver process maintains its own view of GCT in the following way. Local progress is monitored and managed using a variable called Local Completion Time (LCT):</p> +<ul> +<li>the point in time behind which there are no uncompleted operations. No operation in Initiated Operations has a lower or equal Due Time and no operation in Completed Operations has an equal or higher Due Time.</li> +</ul> +<p>LCT is periodically sent to all other driver processes, which all then (locally) set their view of GCT to the minimum LCT of all driver processes. At this point the driver has two, of the necessary three (third covered shortly), pieces of information required for knowing when to execute an operation:</p> +<ul> +<li> +<p><em>Due Time</em>: point in time at which an operation should be executed, assuming all preconditions (e.g., dependencies) have been fulfilled</p> +</li> +<li> +<p><em>GCT</em>: every operation (from Dependencies) with a Due Time before this point in time has completed execution</p> +</li> +</ul> +<p>However, with only GCT to track dependencies the driver has no way of knowing when it is safe to execute any particular dependent operation. What GCT communicates is that all dependencies up to some point in time have completed, but whether or not the dependencies for any particular operation are within these completed operations is unknown. The driver would have to wait until GCT has passed the Due Time (because Dependency Time is always lower) of an operation before that operation could be safely executed, which would result in the undesirable outcome of every operation missing its Due Time. The required information is which particular operation in Dependencies does any operation in Dependents depend on. More specifically, the Due Time of this operation. This is referred to as Dependent Time:</p> +<ul> +<li>in addition to Due Time, every operation in Dependents also has (read: must have) a Dependent Time, which corresponds to the latest Due Time of all the operations it depends on. Once GCT has advanced beyond the Dependent Time of an operation that operation is safe to execute.</li> +</ul> +<p>Using these three mechanisms (Due Time, GCT, and Dependent Time) the driver is able to execute operations, while ensuring their dependencies are satisfied beforehand.</p> +<h3 id="scalable-execution-in-the-presence-of-dependencies">Scalable execution in the Presence of Dependencies</h3> +<p>The mechanisms introduced in part 1 guarantee that dependency constraints are not violated, but in doing so they unavoidably introduce overhead of communication/synchronization between driver threads/processes. To minimize the negative effects that synchronization has on scalability an additional Execution Mode was introduced (more about Execution Modes will be discussed shortly): Windowed Execution. 
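+</p>
+<p>Before looking at Windowed Execution in detail, the following is a minimal sketch of the completion-time bookkeeping described in the previous section. The class and function names are invented for illustration; the actual driver code is considerably more involved.</p>
+<pre tabindex="0"><code># Minimal sketch of LCT/GCT tracking; names are illustrative only.
+import threading
+
+class CompletionTimeTracker:
+    def __init__(self):
+        self.initiated = set()   # Due Times of started but unfinished dependency ops
+        self.completed = set()   # Due Times of finished dependency ops
+        self.lock = threading.Lock()
+
+    def start(self, due_time):
+        with self.lock:
+            self.initiated.add(due_time)
+
+    def finish(self, due_time):
+        with self.lock:
+            self.initiated.remove(due_time)
+            self.completed.add(due_time)
+
+    def local_completion_time(self):
+        # LCT = min(min(Initiated Operations), max(Completed Operations))
+        with self.lock:
+            newest_done = max(self.completed, default=float('-inf'))
+            if self.initiated:
+                return min(min(self.initiated), newest_done)
+            return newest_done
+
+def global_completion_time(trackers):
+    # GCT is the minimum LCT over all driver processes
+    return min(t.local_completion_time() for t in trackers)
+
+def may_execute(op_dependent_time, gct):
+    # A dependent operation is safe once GCT has reached its Dependent Time
+    return gct &gt;= op_dependent_time
+</code></pre>
+<p>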
Windowed Execution has two design goals:</p> +<p>a) make the generated load less &lsquo;bursty&rsquo;</p> +<p>b) allow the driver to &lsquo;scale&rsquo;, so when the driver is given more resources (CPUs, servers, etc.) it is able to generate more load.</p> +<p>In the context of Windowed Execution, operations are executed in groups (Windows), where operations are grouped according to their Due Time. Every Window has a Start Time, a Duration, and an End Time, and Windows contain only those operations that have a Due Time between Window.startTime and Window.endTime. Logically, all operations within a Window are executed at the same time, some time within the Window. No guaranty is made regarding exactly when, or in what order, an operation will execute within its Window.</p> +<p>The reasons this approach is correct are as follows:</p> +<ul> +<li> +<p>Operations belonging to the Dependencies set are never executed in this manner - the Due Times of Dependencies operations are never modified as this would affect how dependencies are tracked</p> +</li> +<li> +<p>The minimum duration between the Dependency Time and Due Time of any operation in Dependents is known (can be calculated by scanning through workload once), this duration is referred to as Safe Time (SafeT)</p> +</li> +<li> +<p>A window does not start executing until the dependencies of all its operations have been fulfilled. This is ensured by enforcing that window execution does not start until</p> +<p>GCT &gt;= window.startTime - (SafeT - window.duration) = window.endTime - SafeT; that is, the duration between GCT and the end of the window is no longer than SafeT</p> +</li> +</ul> +<p>The advantages of such an execution mode are as follows:</p> +<ul> +<li> +<p>As no guarantees are made regarding time or order of operation execution within a Window, GCT no longer needs to be read before the execution of every operation, only before the execution of every window</p> +</li> +<li> +<p>Then, as GCT is read less frequently, it follows that it does not need to be communicated between driver processes as frequently. There is no need or benefit to communicating GCT protocol message more frequently than approximately Window.duration, the side effect of which is reduced network traffic</p> +</li> +<li> +<p>Further, by making no guarantees regarding the order of execution the driver is free to reschedule operations (within Window bounds). The advantage being that operations can be rearranged in such a way as to reduce unwanted bursts of load during execution, which could otherwise occur while synchronizing GCT during demanding workloads. For example, a uniform scheduler may modify operation Due Times to be uniformly distributed across the Window timespan, to &lsquo;smoothen&rsquo; the load within a Window.</p> +</li> +</ul> +<p>As with any system, there are trade-offs to this design, particularly regarding Window.duration. The main trade-off is that between &lsquo;workload resolution&rsquo; and scalability. Increasing Window.duration reduces synchronization but also reduces the resolution at which the workload definition is followed. That is, the generated workload becomes less like the workload definition. However, as this is both bounded and configurable, it is not a major concern. This issue is illustrated in Figure 1, where the same stream of events is split into two different workloads based on different size of the Window. 
The workload with Window size 5 (on the right) has better resolution, especially for the &lsquo;bursty&rsquo; part of the event stream.</p> +<p><img src="window-scheduling.png" alt="image"><br> +Figure 1. Window scheduling</p> +<p>This design also trades a small amount of repeatability for scalability: as there are no timing or ordering guarantees within a window, two executions of the same window are not guaranteed to be equivalent - &lsquo;what happens in the window stays in the window&rsquo;. Despite sacrificing this repeatability, the results of operations do not change. No dependency-altering operations occur during the execution of a Window, therefore results for all queries should be equivalent between two executions of the same workload, there is no effect on the expected result for any given operation.</p> + + + + + SNB Driver - Part 3: Workload Execution Putting It All Together + https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/ + Tue, 20 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-3-workload-execution-putting-it-all-together/ + <p>Up until now we have introduced the <a href="https://ldbcouncil.org/post/snb-driver-part-1">challenges faced when executing the LDBC SNB benchmark</a>, as well as explained <a href="https://ldbcouncil.org/post/snb-driver-part-2-tracking-dependencies-between-queries">how some of these are overcome</a>. With the foundations laid, we can now explain precisely how operations are executed.</p> +<p>Based on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these classifications the driver runtime then knows how each operation should be executed. These modes, as well as what they mean to the driver runtime, are described below.</p> +<h3 id="dependency-modes">Dependency Modes</h3> +<p>While executing a workload the driver treats operations differently, depending on their Dependency Mode. In the previous section operations were categorized by whether or not they are in the sets Dependencies and/or Dependents.</p> +<p>Another way of communicating the same categorization is by assigning a Dependency Mode to operations - every operation type generated by a workload definition must be assigned to exactly one Dependency Mode. Dependency modes define dependencies, constraints on operation execution order. The driver supports a number of different Dependency Modes: None, Read Only, Write Only, Read Write. 
During workload execution, operations of each type are treated as follows:</p>
+<p><strong>• None</strong></p>
+<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations having completed executing)</p>
+<p>– Prior Execution: do nothing – After Execution: do nothing</p>
+<p><strong>• Read Only</strong></p>
+<p>Depended On (NO): operations do not introduce dependencies with other operations (i.e., the correct execution of no other operation depends on these operations having completed executing)</p>
+<p>Dependent On (YES): operation execution does depend on GCT having advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p>
+<p>– Prior Execution: wait for GCT &gt;= operation.DepT – After Execution: do nothing</p>
+<p><strong>• Write Only</strong></p>
+<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p>
+<p>Dependent On (NO): operation execution does not depend on GCT having advanced sufficiently (i.e., correct execution of these operations does not depend on any other operations having completed execution)</p>
+<p>– Prior Execution: add operation to Initiated Operations</p>
+<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p>
+<p><strong>• Read Write</strong></p>
+<p>Depended On (YES): operations do introduce dependencies with other operations (i.e., the correct execution of certain other operations requires these operations to have completed executing, i.e., to advance GCT)</p>
+<p>Dependent On (YES): operation execution does depend on GCT having advanced sufficiently (i.e., correct execution of these operations requires that certain operations have completed execution)</p>
+<p>– Prior Execution: add operation to Initiated Operations, wait for GCT &gt;= operation.DepT</p>
+<p>– After Execution: remove operation from Initiated Operations, add operation to Completed Operations</p>
+<h3 id="execution-modes">Execution Modes</h3>
+<p>Execution Modes relate to how operations are scheduled, when they are executed, and what their failure conditions are. Each operation type in a workload definition must be assigned to exactly one Execution Mode. The driver supports a number of different Execution Modes: Asynchronous, Synchronous, Partially Synchronous. It splits a single workload operation stream into multiple streams, zero or more streams per Execution Mode.
During workload execution, operations from each of these streams are treated as follows.</p> +<p><strong>• Asynchronous</strong>: operations are executed individually, when their Due Time arrives.</p> +<p>Motivation: This is the default execution mode, it executes operations as true to the workload definition as possible.</p> +<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler – Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: unbounded</p> +<p>– Max Execution Time: unbounded</p> +<p>– Failure: operation execution starts later than: operation.DueT Tolerated Delay</p> +<p><strong>• Synchronous</strong>: operations are executed individually, sequentially, in blocking manner.</p> +<p>Motivation: Some dependencies are difficult to capture efficiently with SafeT and GCT alone. For example, social applications often support conversations via posts and likes, where likes depend on the existence of posts. Furthermore, posts and likes also depend on the existence of the users that make them. However, users are created at a lower frequency than posts and likes, and it can be assumed they do not immediately start creating content. As such, a reasonably long SafeT can be used between the creation of a user and the first time that user creates posts or likes. Conversely, posts are often replied to and/or liked soon after their creation, meaning a short SafeT would be necessary to maintain the ordering dependency. Consequently, maintaining the dependencies related to conversations would require a short SafeT, and hence a small window. This results in windows containing fewer operations, leading to less potential for parallelism within windows, less freedom in scheduling, more synchronization, and greater likelihood of bursty behavior - all negative things.</p> +<p>The alternative offered by Synchronous Execution is that, when practical, operations of certain types can be partitioned (e.g. posts and likes could be partitioned by the forum in which they appear), and partitions assigned to driver processes. Using the social application example from above, if all posts and likes were partitioned by forum the driver process that executes the operations from any partition could simply execute them sequentially. 
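+</p>
+<p>As a rough illustration of this partitioning idea, the sketch below groups operations by forum and executes each group sequentially while the groups run in parallel. The operation fields and the <code>execute</code> callback are placeholders, not the driver&rsquo;s actual API.</p>
+<pre tabindex="0"><code># Rough sketch: partition update operations by forum, run partitions in parallel,
+# keep operations within one forum strictly sequential. Names are placeholders.
+from collections import defaultdict
+from concurrent.futures import ThreadPoolExecutor
+
+def run_partitioned(operations, execute, workers=8):
+    partitions = defaultdict(list)
+    for op in sorted(operations, key=lambda o: o.due_time):
+        partitions[op.forum_id].append(op)    # per-forum order is preserved
+
+    def run_sequentially(ops):
+        for op in ops:                        # no global synchronization needed here
+            execute(op)
+
+    with ThreadPoolExecutor(max_workers=workers) as pool:
+        for ops in partitions.values():
+            pool.submit(run_sequentially, ops)
+</code></pre>
+<p>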
Then the only dependency to maintain would be on user operations, reducing synchronization dramatically, and parallelism could still be achieved as each partition would be executed independently, in parallel, by a different driver process.</p> +<p>– Re-scheduling Before Execution: None: operation.DueT not modified by scheduler</p> +<p>– Execute When time &gt;= operation.DueT and previousOperation.completed == true (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: 1</p> +<p>– Max Execution Time: nextOperation.DueT - operation.DueT</p> +<p>– Failure: operation execution starts later than: operation.DueT Tolerated Delay E.g., if previousOperation did not complete in time, forcing current operation to wait for longer than the tolerated-delay</p> +<p><strong>• Partially Synchronous</strong> (Windowed Execution, described in Section 3.4 in more details), groups of operations from the same time window are executed together</p> +<p>– Re-scheduling Before Execution: Yes, as long as the following still holds:</p> +<p>window.startTime &lt;= operation.DueT &lt; window.startTime + window.duration</p> +<p>Operations within a window may be scheduled in any way, as long as they remain in the window from which they originated: their Due Times, and therefore ordering, may be modified</p> +<p>– Execute When time &gt;= operation.DueT (and GCT &gt;= operation.DepT)</p> +<p>– Max Concurrent Executions: number of operations within window</p> +<p>– Max Execution Time: (window.startTime + window.duration) - operation.DueT</p> +<p>– Failure: operation execution starts later than: window.startTime window.duration operation execution does not finish by: window.startTime + window.duration</p> +<h3 id="tying-it-back-to-ldbc-snb">Tying it back to LDBC SNB</h3> +<p>The driver was designed to execute the workload of LDBC SNB. As discussed, the main challenge of running queries in parallel on graph-shaped data stem from dependencies introduced by the graph structure. In other words, workload partitioning becomes as hard as graph partitioning.</p> +<p>The LDBC SNB data can in fact be seen as a union of two parts:</p> +<ol> +<li> +<p>Core Data: relatively small and dense friendship graph (not more than 10% of the data). Updates on this part are very hard to partition among driver threads, since the graph is essentially a single dense strongly connected component.</p> +</li> +<li> +<p>User Activity Data: posts, replies, likes; this is by far the biggest part of the data. Updates on this part are easily partitioned as long as the dependencies with the &ldquo;core&rdquo; part are satisfied (i.e., users don&rsquo;t post things before the profiles are created, etc.).</p> +</li> +</ol> +<p>In order to avoid friendship graph partitioning, the driver introduces the concept SafeT, the minimal simulation time that should pass between two dependent events.</p> +<p>This property is enforced by the data generator, i.e. the driver does not need to change or delay some operations in order to guarantee dependency safety. Respecting dependencies now means globally communicating the advances of the Global Completion Time, and making sure the operations do not start earlier than SafeT from their dependents.</p> +<p>On the other hand, the driver exploits the fact that some of the dependencies in fact do not hinder partitioning: although replies to the post can only be sent after the post is created, these kinds of dependencies are satisfied if we partition workload by forums. 
This way, all (update) operations on posts and comments from one forum are assigned to one driver thread. Since there is typically a lot of forums, each driver thread gets multiple ones. Updates from one forum are then run in Synchronous Execution Mode, and parallelism is achieved by running many distinct forums in parallel. By doing so, we can add posts and replies to forums at very high frequency without the need to communicate the GCT across driver instances (i.e. we efficiently create the so-called flash-mob effects in the posting/replying workload).</p> + + + + + Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide + https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/ + Tue, 13 Jan 2015 00:00:00 +0000 + + https://ldbcouncil.org/post/running-the-semantic-publishing-benchmark-on-sesame-a-step-by-step-guide/ + <p>Until now we have discussed several aspects of the <a href="https://ldbcouncil.org/benchmarks/spb">Semantic Publishing Benchmark (SPB)</a> such as the <a href="https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark">difference in performance between virtual and real servers configuration</a>, how to choose an <a href="https://ldbcouncil.org/post/making-semantic-publishing-execution-rules">appropriate query mix</a> for a benchmark run and our experience with using SPB in the development process of GraphDB for <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">finding performance issues</a>.</p> +<p>In this post we provide a step-by-step guide on how to run SPB using the <a href="http://rdf4j.org/">Sesame</a> RDF data store on a fresh install of <a href="http://releases.ubuntu.com/14.04.1/">Ubuntu Server 14.04.1</a>. The scenario is easy to adapt to other RDF triple stores which support the Sesame Framework used for querying and analyzing RDF data.</p> +<h3 id="prerequisites">Prerequisites</h3> +<p>We start with a fresh server installation, but before proceeding with setup of the Sesame Data Store and SPB benchmark we need the following pieces of software up and running:</p> +<ul> +<li>Git</li> +<li>Apache Ant 1.8 or higher</li> +<li>OpenJDK 6 or Oracle JDK 6 or higher</li> +<li>Apache Tomcat 7 or higher</li> +</ul> +<p>If you already have these components installed on your machine you can directly proceed to the next section: <em>Installing Sesame</em></p> +<p>Following are sample commands which can be used to install the required software components:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo apt-get install git +</span></span><span style="display:flex;"><span>sudo apt-get install ant +</span></span><span style="display:flex;"><span>sudo apt-get install default-jdk +</span></span><span style="display:flex;"><span>sudo apt-get install tomcat7 +</span></span></code></pre></div><p>Optionally Apache Tomcat Server can be downloaded as a zipped file and extracted in a location of choice.</p> +<p>After a successful installation of Apache Tomcat you should be able to get the default splash page <em>“It works”</em> when you open your web browser and enter the following address: http://&lt;your_ip_address&gt;:8080</p> +<h3 id="installing-sesame">Installing Sesame</h3> +<p>We will use current Sesame version 2.7.14. 
You can download it <a href="http://sourceforge.net/projects/sesame/files/Sesame%202/">here</a> or run following command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>wget <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> <span style="color:#e6db74">&#34;http://sourceforge.net/projects/sesame/files/Sesame%202/2.7.14/openrdf-sesame-2.7.14-sdk.tar.gz/download&#34;</span> <span style="color:#ae81ff">\\</span> +</span></span><span style="display:flex;"><span> -O openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>Then extract the Sesame tarball:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>tar -xvzf openrdf-sesame-2.7.14-sdk.tar.gz +</span></span></code></pre></div><p>To deploy sesame you have to copy the two war files that are in <em>openrdf-sesame-2.7.14/war</em> to <em>/var/lib/tomcat7/webapps</em></p> +<p>From <em>openrdf-sesame-2.7.14/war</em> you can do it with command:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>cp openrdf-*.war &lt;tomcat_install&gt;/webapps +</span></span></code></pre></div><p>Sesame applications write and store configuration files in a single directory and the tomcat server needs permissions for it.</p> +<p>By default the configuration directory is: <em>/usr/share/tomcat7/.aduna</em></p> +<p>Create the directory:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo mkdir /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Then change the ownership:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chown tomcat7 /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>And finally you should give the necessary permissions:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>sudo chmod o+rwx /usr/share/tomcat7/.aduna +</span></span></code></pre></div><p>Now when you go to: http://&lt;your_ip_address&gt;:8080/openrdf-workbench/repositories</p> +<p>You should get a screen like this:</p> +<p><img src="01-Sesame-repo-list.png" alt="image"></p> +<h3 id="setup-spb">Setup SPB</h3> +<p>You can download the SPB code and find brief documentation on GitHub:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm">https://github.com/ldbc/ldbc_spb_bm</a></p> +<p>A detailed documentation is located here:</p> +<p><a href="https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf">https://github.com/ldbc/ldbc_spb_bm/blob/master/doc/LDBC_SPB_v0.3.pdf</a></p> +<p>SPB offers many configuration options which control various features of the benchmark e.g.:</p> +<ul> +<li>query mixes</li> +<li>dataset size</li> +<li>loading 
datasets</li> +<li>number of agents</li> +<li>validating results</li> +<li>test conformance to OWL2-RL ruleset</li> +<li>update rate of agents</li> +</ul> +<p>Here we demonstrate how to generate a dataset and execute a simple test<br> +run with it.</p> +<p>First download the SPB source code from the repository:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>git clone https://github.com/ldbc/ldbc_spb_bm.git +</span></span></code></pre></div><p>Then in the ldbc_spb_bm directory build the project:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>ant build-basic-querymix +</span></span></code></pre></div><p>If you simply execute the command:</p> +<pre tabindex="0"><code>ant +</code></pre><p>you’ll get a list of all available build configurations for the SPB test driver, but for the purpose of this step-by-step guide, configuration shown above is sufficient.</p> +<p>Depending on generated dataset size a bigger java heap size may be required for the Sesame Store. You can change it by adding following arguments to Tomcat&rsquo;s startup files e.g. in <em>catalina.sh</em>:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>export JAVA_OPTS<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;-d64 -Xmx4G&#34;</span> +</span></span></code></pre></div><p>To run the Benchmark you need to create a repository in the Sesame Data Store, similar to the following screenshot:</p> +<p><img src="02-Sesame-create-repo.png" alt="image"></p> +<p>Then we need to point the benchmark test driver to the SPARQL endpoint of that repository. 
This is done in <em>ldbc_spb_bm/dist/test.properties</em> file.</p> +<p>The default value of <em>datasetSize</em> in the properties is set to be 10M, but for the purpose of this guide we will decrease it to 1M.</p> +<p>You need to change</p> +<pre tabindex="0"><code>datasetSize=1000000 +</code></pre><p>Also the URLs of the SPARQL endpoint for the repository</p> +<pre tabindex="0"><code>endpointURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1 +endpointUpdateURL=http://localhost:8080/openrdf-sesame/repositories/ldbc1/statements +</code></pre><p>First step, before measuring the performance of a triple store, is to load the reference-knowledge data, generate a 1M dataset, load it into the repository and finally generate query substitution parameters.</p> +<p>These are the settings to do that, following parameters will &lsquo;instruct&rsquo; the SPB test driver to perform all the actions described above:</p> +<pre tabindex="0"><code>#Benchmark Operational Phases +loadOntologies=true +loadReferenceDatasets=true +generateCreativeWorks=true +loadCreativeWorks=true +generateQuerySubstitutionParameters=true +validateQueryResults=false +warmUp=false +runBenchmark=false +runBenchmarkOnlineReplicationAndBackup=false +checkConformance=false +</code></pre><p>To run the benchmark execute the following:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>java -jar semantic_publishing_benchmark-basic-standard.jar +</span></span><span style="display:flex;"><span>test.properties +</span></span></code></pre></div><p>When the initial run has finished, we should have a 1M dataset loaded into the repository and a set of files with query substitution parameters.</p> +<p>Next we will measure the performance of Sesame Data Store by changing some configuration properties:</p> +<pre tabindex="0"><code>#Benchmark Configuration Parameters +warmupPeriodSeconds=60 +benchmarkRunPeriodSeconds=300 +... +#Benchmark Operational Phases +loadOntologies=false +loadReferenceDatasets=false +generateCreativeWorks=false +loadCreativeWorks=false +generateQuerySubstitutionParameters=false +validateQueryResults=false +warmUp=true +runBenchmark=true +runBenchmarkOnlineReplicationAndBackup=false +checkConformance=false +</code></pre><p>After the benchmark test run has finished result files are saved in folder: <em>dist/logs</em></p> +<p>There you will find three types of results: the result summary of the benchmark run (<em>semantic_publishing_benchmark_results.log),</em> brief results and detailed results.</p> +<p>In <em>semantic_publishing_benchmark_results.log</em> you will find the results distributed per seconds. 
They should be similar to the listing below:</p>
+<p>Benchmark Results for the 300th second</p>
+<pre tabindex="0"><code>Seconds : 300 (completed query mixes : 0)
+ Editorial:
+ 2 agents
+
+ 9 inserts (avg : 22484 ms, min : 115 ms, max : 81389 ms)
+ 0 updates (avg : 0 ms, min : 0 ms, max : 0 ms)
+ 0 deletes (avg : 0 ms, min : 0 ms, max : 0 ms)
+
+ 9 operations (9 CW Inserts (0 errors), 0 CW Updates (1 errors), 0 CW Deletions (2 errors))
+ 0.0300 average operations per second
+
+ Aggregation:
+ 8 agents
+
+ 2 Q1 queries (avg : 319 ms, min : 188 ms, max : 451 ms, 0 errors)
+ 3 Q2 queries (avg : 550 ms, min : 256 ms, max : 937 ms, 0 errors)
+ 1 Q3 queries (avg : 58380 ms, min : 58380 ms, max : 58380 ms, 0 errors)
+ 2 Q4 queries (avg : 65250 ms, min : 40024 ms, max : 90476 ms, 0 errors)
+ 1 Q5 queries (avg : 84220 ms, min : 84220 ms, max : 84220 ms, 0 errors)
+ 2 Q6 queries (avg : 34620 ms, min : 24499 ms, max : 44741 ms, 0 errors)
+ 3 Q7 queries (avg : 5892 ms, min : 4410 ms, max : 8528 ms, 0 errors)
+ 2 Q8 queries (avg : 3537 ms, min : 546 ms, max : 6528 ms, 0 errors)
+ 4 Q9 queries (avg : 148573 ms, min : 139078 ms, max : 169559 ms, 0 errors)
+</code></pre><p>This step-by-step guide gave an introduction to setting up and running the SPB on a Sesame Data Store. Further details can be found in the reference documentation listed above.</p>
+<p>If you have any trouble running the benchmark, don&rsquo;t hesitate to comment or use our social media channels.</p>
+<p>In a future post we will go through some of the parameters of SPB and check their performance implications.</p>
+
+
+
+
+ Semantic Publishing Instance Matching Benchmark
+ https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/
+ Tue, 30 Dec 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/semantic-publishing-instance-matching-benchmark/
+ <p>The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the-art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.</p>
+<p>The SPIMBench test cases provide a systematic way for testing the performance of instance matching systems in different settings. 
SPIMBench supports the types of test cases already adopted by existing instance matching benchmarks:</p> +<ul> +<li>value-based test cases based on applying value transformations (e.g., blank character addition and deletion, change of date format, abbreviations, synonyms) on triples relating to given input entity</li> +<li>structure-based test cases characterized by a structural transformation (e.g., different nesting levels for properties, property splitting, aggregation)</li> +</ul> +<p>The novelty of SPIMBench lies in the support for the following semantics-aware test cases defined on the basis of OWL constructs:</p> +<ul> +<li>instance (in)equality (owl:sameAs, owl:differentFrom)</li> +<li>class and property equivalence (owl:equivalentClass, owl:equivalentProperty)</li> +<li>class and property disjointness (owl:disjointWith, owl:AllDisjointClasses, owl:propertyDisjointWith, owl:AllDisjointProperties)</li> +<li>class and property hierarchies (rdfs:subClassOf, rdfs:subPropertyOf)</li> +<li>property constraints (owl:FunctionalProperty, owl:InverseFunctionalProperty)</li> +<li>complex class definitions (owl:unionOf, owl:intersectionOf)</li> +</ul> +<p>SPIMBench uses and extends the ontologies of LDBC&rsquo;s Semantic Publishing Benchmark (SPB) to tackle the more complex schema constructs expressed in terms of OWL. It also extends SPB&rsquo;s data generator to first generate a synthetic source dataset that does not contain any matches, and then to generate matches and non-matches to entities of the source dataset to address the supported transformations and OWL constructs. The data generation process allows the creation of arbitrary large datasets, thus supporting the evaluation of both the scalability and the matching quality of an instance matching system.</p> +<p>Value and structure-based test cases are implemented using the SWING framework <a href="#references">[1]</a> on data and object type properties respectively. These are produced by applying the appropriate transformation(s) on a source instance to obtain a target instance. Semantics-based test cases are produced in the same way as with the value and structure-based test cases with the difference that appropriate triples are constructed and added in the target dataset to consider the respective OWL constructs.</p> +<p>SPIMBench, in addition to the semantics-based test cases that differentiate it from existing instance matching benchmarks, also offers a weighted gold standard used to judge the quality of answers of instance matching systems. It contains generated matches (a pair consisting of an entity of the source dataset and an entity of the target dataset) the type of test case it represents, the property on which a transformation was applied (in the case of value-based and structure-based test cases), and a weight that quantifies how easy it is to detect this match automatically. SPIMBench adopts an information-theoretical approach by applying multi-relational learning to compute the weight of the pair of matched instances by measuring the information loss that results from applying transformations to the source data to generate the target data. 
This detailed information, which is not provided by state-of-the-art benchmarks, allows users of SPIMBench (e.g., developers of IM systems) to more easily identify the reasons underlying the performance results obtained using SPIMBench and thereby supports the debugging of instance matching systems.</p>
+<p>SPIMBench can be downloaded from <a href="https://github.com/jsaveta/SPIMBench">our repository</a> and a more thorough description thereof can be found on <a href="http://www.ics.forth.gr/isl/spimbench/">http://www.ics.forth.gr/isl/spimbench/</a>.</p>
+<h4 id="references">References</h4>
+<p>[1] A. Ferrara, S. Montanelli, J. Noessner, and H. Stuckenschmidt. Benchmarking Matching Applications on the Semantic Web. In ESWC, 2011.</p>
+
+
+
+
+ Further Developments in SNB BI Workload
+ https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/
+ Thu, 18 Dec 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/further-developments-in-snb-bi-workload/
+ <p>We are presently working on the SNB BI workload. Andrey Gubichev of TU München and I are going through the queries and are playing with two SQL-based implementations, one on Virtuoso and the other on Hyper.</p>
+<p>As discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.</p>
+<p>There are obvious marketing applications for an SNB-like dataset. There are also security-related applications, ranging from fraud detection to intelligence analysis. The latter category is significant but harder to approach, as much of the detail of best practice is itself not in the open. In this post, I will outline some ideas discussed over time that might crystallize into a security-related section in the SNB BI workload. We invite comments from practitioners for making the business questions more relevant while protecting sensitive details.</p>
+<p>Let’s look at what scenarios would fit with the dataset. We have people, different kinds of connections between people, organizations, places and messages. Messages (posts/replies), people and organizations are geo-tagged. Making a finer level of geo-tagging, with actual GPS coordinates, travel itineraries, etc., all referring to real places, would make the data even more interesting. The geo dimension will be explored separately in a forthcoming post.</p>
+<p>One of the first things to appear when approaching the question is that the analysis of behavior patterns over time is not easily captured in purely declarative queries. For example, the temporal sequence of events and the quantity and quality of interactions between players lead to intractably long queries which are hard to understand and debug. Therefore, views and intermediate materializations become increasingly necessary.</p>
+<p>Another feature of the scene is that information is never complete. Even if logs are complete for any particular system, there are always possible interactions outside of the system. Therefore we tend to get match scores rather than strictly Boolean conditions. Since everybody is related to everybody else via a relatively short path, the nature and strength of the relationship is key to interpreting its significance.</p>
+<p>Since a query consisting of scores and outer joins only is difficult to interpret and optimize, and since the information is seldom complete, some blanks may have to be filled in by guesses. 
The database must therefore contain metadata about this.</p>
+<p>An orthogonal aspect to security applications is the access control of the database itself. One might assume that if a data warehouse of analyzable information is put together, the analyst would have access to the entirety of it. This is, however, not necessarily the case, since the information itself and its provenance may fall under different compartments.</p>
+<p>So, let’s see how some of these aspects could be captured in the SNB context.</p>
+<p>Geography - We materialize a table of travel events, so that an unbroken sequence of posts from the same location (e.g. country) other than the residence of the poster forms a travel event. The posts may have a fine-grained position (IP, GPS coordinates of photos) that marks an itinerary. This is already beyond basic SQL, needing a procedure or window functions.</p>
+<p>The communication between people is implicit in reply threads and forum memberships. A reply is the closest that one comes to a person-to-person message in the dataset. Otherwise all content is posted to forums with more or fewer participants. Membership in a high-traffic forum with few participants would indicate a strong connection. Calculating these time-varying connection strengths is a lot of work and a lot of text in queries. Keeping things simple requires materializing a sparse “adjacency cube,” i.e. a relation of person1, person2, time bucket -&gt; connection strength. In the SNB case the connection strength may be derived from reciprocal replies, likes, being in the same forums, knowing each other, etc. Selectivity is important, i.e. being in many small forums together counts for more than being in ones where everybody else also participates.</p>
+<p>The behavior of people in SNB is not identical from person to person, but for the same person it follows a preset pattern. Suppose a question like “which person with access to secrets has a marked change of online behavior?” The change would be starting or stopping communication with a given set of people, for example. Think that the spy meets the future spymaster at a public occasion, has a series of exchanges, travels to an atypical destination, then stops all open contact with the spymaster or related individuals. Patterns like this do not occur in the data but can be introduced easily enough.</p>
+<p>In John le Carré’s A Perfect Spy the main character is caught because it comes to light that his travel routes nearly always corresponded to his controller’s. This would make a query. This could be cast in marketing terms as a “(un)common shopping basket.”</p>
+<p>Analytics becomes prediction when one part of a pattern exists without the expected next stage. Thus the same query template can serve for detecting full or partial instances of a pattern, depending on how the scores are interpreted.</p>
+<p>From a database angle, these questions group on an item with internal structure. For the shopping basket this is a set. For the travel routes this is an ordered sequence of space/time points, with a match tolerance on the spatial and temporal elements. Another characteristic is that there is a baseline of expectations and the actual behavior. Both have structure, e.g. the occupation/location/interest/age of one’s social circle. These need to be condensed into a sort of metric space and then changes and rates of change can be observed. Again, this calls for a multidimensional cube to be created as a summary, then algorithms to be applied to this. 
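</p>
+<p>To make the “adjacency cube” a bit more concrete, here is a minimal SQL sketch of how one slice of it could be materialized from reciprocal replies. The table and column names (message, message_id, creator_id, reply_of, creation_date) are made up for illustration and do not correspond to any particular SNB schema; likes, shared forum memberships and knows edges would contribute further, selectivity-weighted terms to the strength score:</p>
+<pre tabindex="0"><code>-- Sketch only: per month, count how often person1 replied to person2.
+CREATE TABLE adjacency_cube AS
+SELECT r.creator_id AS person1,
+       m.creator_id AS person2,
+       (EXTRACT(YEAR FROM r.creation_date) * 12
+        + EXTRACT(MONTH FROM r.creation_date)) AS time_bucket,
+       COUNT(*) AS reply_count        -- one ingredient of the connection strength
+FROM message r
+JOIN message m ON r.reply_of = m.message_id
+WHERE r.creator_id &lt;&gt; m.creator_id
+GROUP BY r.creator_id, m.creator_id,
+         (EXTRACT(YEAR FROM r.creation_date) * 12
+          + EXTRACT(MONTH FROM r.creation_date));
+</code></pre>
+<p>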
The declarative BI query a la TPC-H does not easily capture this all.</p> +<p>This leads us to graph analytics in a broader sense. Some of the questions addressed here will still fit in the materialized summaries+declarative queries pattern but the more complex summarization and clustering moves towards iterative algorithms.</p> +<p>There is at present a strong interest in developing graph analytics benchmarks in LDBC. This is an activity that extends beyond the FP7 project duration and beyond the initial partners. To this effect I have implemented some SQL extensions for BSP style processing, as hinted at on my blog. These will be covered in more detail in January, when there are actual experiments.</p> + + + + + Sizing AWS Instances for the Semantic Publishing Benchmark + https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/ + Wed, 17 Dec 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/sizing-aws-instances-for-the-semantic-publishing-benchmark/ + <p>LDBC&rsquo;s <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the famous <a href="http://www.bbc.co.uk/blogs/legacy/bbcinternet/2010/07/bbc_world_cup_2010_dynamic_sem.html">BBC Dynamic Semantic Publishing</a> scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volume of read requests (SPARQL queries collecting recent content and data to generate web page on a specific subject, e.g. Frank Lampard). As we <a href="https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues">wrote earlier</a>, SPB was already successfully used to help developers to identify performance issues and to introduce optimizations in SPARQL engines such as GraphDB and Virtuoso. Now we are at the point to experiment with different sizes of the benchmark and different hardware configurations.</p> +<p>Lately we tested different Amazon Web Services (<a href="https://aws.amazon.com/">AWS</a>) instance types for running SPB basic interactive query mix in parallel with the standard editorial updates – precisely the type of workload that <a href="https://www.ontotext.com/products/ontotext-graphdb/">GraphDB</a> experiences in the backend of BBC Sport website. We discovered and report below a number of practical guidelines about the optimal instance types and configurations. We have proven that SPB 50M workloads can be executed efficiently on a mid-sized AWS instance – c3.2xlarge machine executes 16 read queries and 15 update operations per second. For $1 paid to Amazon for such instance GraphDB executes 140 000 queries and 120 000 updates. 
The most interesting discovery in this experiment is that if the BBC were hosting the triplestore behind their Dynamic Semantic Publishing architecture at AWS, the total cost of the server infrastructure behind their World Cup 2010 website would have been about $80/day.</p>
+<h3 id="the-experiment">The Experiment</h3>
+<p>For our tests we use:</p>
+<ul>
+<li>GraphDB Standard v6.1</li>
+<li>LDBC-SPB test driver (version 0.1.dc9a626 from 10.Nov.2014) configured as follows:
+<ul>
+<li>8 aggregation agents (read threads) and 2 editorial agents (write threads); for some configurations we experimented with different numbers of agents also</li>
+<li>50M dataset (SF1)</li>
+<li>40 minutes of benchmark run time (60 seconds of warm up)</li>
+</ul>
+</li>
+<li>5 different Amazon EC2 instances and one local server</li>
+</ul>
+<p>Each test run is cold, i.e. data is newly loaded for each run. We set a 5 GByte cache configuration, which is sufficient for the size of the generated dataset. We use the same query substitution parameters (the same randomization seed) for every run, so that we are sure that all test runs are identical.</p>
+<p>We use two types of instances – M3 and C3 instances. They both provide SSD storage for fast I/O performance. The M3 instances come with an E5-2670v2, 2.50GHz CPU and provide good all-round performance, while the C3 instances are compute-optimized with a stronger CPU – E5-2680v2, 2.80GHz, but have half as much memory as the M3.</p>
+<p>We also use a local physical server with dual CPUs – E5-2650v2, 2.60GHz – 256GB of RAM and a RAID-0 array of SSDs, in order to provide a reference point for interpreting the performance of the virtualized AWS instances. The CPU capacity of the AWS instances is measured in vCPUs (virtual CPUs). A vCPU is a logical core – one hyper-thread of one physical core of the corresponding Intel Xeon processor used by Amazon. This means that a vCPU represents roughly half a physical core, even though the performance of a hyper-threaded core is not directly comparable with two non-hyper-threaded cores. We should keep this in mind when comparing AWS instances to physical machines, i.e. our local server with two CPUs with 8 physical cores each has 32 logical cores, which is more than the c3.4xlarge instance with 16 vCPUs.</p>
+<h3 id="the-results">The Results</h3>
+<p>For the tests we measured:</p>
+<ul>
+<li><em>queries/s</em> for the read threads, where queries include SELECT and CONSTRUCT</li>
+<li><em>updates/s</em> for the write threads, where an update operation is INSERT or DELETE</li>
+<li><em>queries/$</em> and <em>updates/$</em> – queries or updates per dollar, calculated for each AWS instance type from the hourly price and the measured throughput (throughput x 3600 seconds / price per hour)</li>
+<li><em>update/vCPU</em> – modification operations per vCPU per second</li>
+</ul>
+<p>Results (Table 1) provide strong evidence that performance depends mostly on processor power. This applies to both queries and updates, which in the current AWS setup track one another closely. Comparing M3 and C3 instances with equal vCPUs, we can see that performance is only slightly higher for the M3 machines and even lower for selects with 8 vCPUs. 
Taking into account the lower price of C3 because of their lower memory, it is clear that C3 machines are better suited for this type of workload and the sweet spot between price and performance is c3.2xlarge machine.</p> +<p>The improvement in performance between the c3.xlarge and c3.2xlarge is more than twofold where the improvement between c3.2xlarge and c3.4xlarge is considerably lower. We also observe slower growth between c3.4xlarge and the local server machine. This is an indication that for SPB at this scale the difference between 7.5GB and 15GB of RAM is substantial, but RAM above this amount cannot be utilized efficiently by GraphDB.</p> +<p>Table 1. SPB Measurement Results on AWS and Local Servers</p> +<table> +<thead> +<tr> +<th>Server Type</th> +<th>vCPUs</th> +<th>R/W Agents</th> +<th>RAM (GB)</th> +<th>&ldquo;Storage (GB, SSD)&rdquo;</th> +<th>Price USD/h</th> +<th>Queries/ sec.</th> +<th>Updates/ sec.</th> +<th>Queries/ USD</th> +<th>Updates/ USD</th> +<th>Updates/ vCPU</th> +</tr> +</thead> +<tbody> +<tr> +<td>m3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>15</td> +<td>2x 40</td> +<td>0.28</td> +<td>8.39</td> +<td>8.23</td> +<td>107 882</td> +<td>105 873</td> +<td>2.06</td> +</tr> +<tr> +<td>m3.2xlarge</td> +<td>8</td> +<td>8/2</td> +<td>30</td> +<td>2x 80</td> +<td>0.56</td> +<td>15.44</td> +<td>15.67</td> +<td>99 282</td> +<td>100 752</td> +<td>1.96</td> +</tr> +<tr> +<td>c3.xlarge</td> +<td>4</td> +<td>8/2</td> +<td>7.5</td> +<td>2x 40</td> +<td>0.21</td> +<td>7.17</td> +<td>6.78</td> +<td>122 890</td> +<td>116 292</td> +<td>1.7</td> +</tr> +<tr> +<td><strong>c3.2xlarge</strong></td> +<td><strong>8</strong></td> +<td><strong>8/2</strong></td> +<td><strong>15</strong></td> +<td><strong>2x 80</strong></td> +<td><strong>0.42</strong></td> +<td><strong>16.46</strong></td> +<td><strong>14.56</strong></td> +<td><strong>141 107</strong></td> +<td><strong>124 839</strong></td> +<td><strong>1.82</strong></td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>8/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>23.23</strong></td> +<td><strong>21.17</strong></td> +<td><strong>99 578</strong></td> +<td><strong>90 736</strong></td> +<td><strong>1.32</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>8/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>22.89</td> +<td>20.39</td> +<td>98 100</td> +<td>87 386</td> +<td>1.27</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/2</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.6</td> +<td>19.11</td> +<td>114 000</td> +<td>81 900</td> +<td>1.19</td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>10/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>26.19</td> +<td>19.18</td> +<td>112 243</td> +<td>82 200</td> +<td>1.2</td> +</tr> +<tr> +<td><strong>c3.4xlarge</strong></td> +<td><strong>16</strong></td> +<td><strong>14/2</strong></td> +<td><strong>30</strong></td> +<td><strong>2x 160</strong></td> +<td><strong>0.84</strong></td> +<td><strong>30.84</strong></td> +<td><strong>16.88</strong></td> +<td><strong>132 171</strong></td> +<td><strong>72 343</strong></td> +<td><strong>1.06</strong></td> +</tr> +<tr> +<td>c3.4xlarge</td> +<td>16</td> +<td>14/3</td> +<td>30</td> +<td>2x 160</td> +<td>0.84</td> +<td>29.67</td> +<td>17.8</td> +<td>127 157</td> +<td>76 286</td> +<td>1.11</td> +</tr> +<tr> +<td>Local</td> +<td>32</td> +<td>8/2</td> +<td>256</td> +<td>8x 256</td> 
+<td>0.85</td>
+<td>37.11</td>
+<td>32.04</td>
+<td>156 712</td>
+<td>135 302</td>
+<td>1</td>
+</tr>
+<tr>
+<td>Local</td>
+<td>32</td>
+<td>8/3</td>
+<td>256</td>
+<td>8x 256</td>
+<td>0.85</td>
+<td>37.31</td>
+<td>32.07</td>
+<td>157 557</td>
+<td>135 429</td>
+<td>1</td>
+</tr>
+<tr>
+<td><strong>Local</strong></td>
+<td><strong>32</strong></td>
+<td><strong>10/2</strong></td>
+<td><strong>256</strong></td>
+<td><strong>8x 256</strong></td>
+<td><strong>0.85</strong></td>
+<td><strong>40</strong></td>
+<td><strong>31.01</strong></td>
+<td><strong>168 916</strong></td>
+<td><strong>130 952</strong></td>
+<td><strong>0.97</strong></td>
+</tr>
+<tr>
+<td>Local</td>
+<td>32</td>
+<td>14/2</td>
+<td>256</td>
+<td>8x 256</td>
+<td>0.85</td>
+<td>36.39</td>
+<td>26.42</td>
+<td>153 672</td>
+<td>111 569</td>
+<td>0.83</td>
+</tr>
+<tr>
+<td>Local</td>
+<td>32</td>
+<td>14/3</td>
+<td>256</td>
+<td>8x 256</td>
+<td>0.85</td>
+<td>36.22</td>
+<td>26.39</td>
+<td>152 954</td>
+<td>111 443</td>
+<td>0.82</td>
+</tr>
+<tr>
+<td>Local</td>
+<td>32</td>
+<td>20/2</td>
+<td>256</td>
+<td>8x 256</td>
+<td>0.85</td>
+<td>34.59</td>
+<td>23.86</td>
+<td>146 070</td>
+<td>100 759</td>
+<td>0.75</td>
+</tr>
+</tbody>
+</table>
+<h3 id="the-optimal-number-of-test-agents">The Optimal Number of Test Agents</h3>
+<p>Experimenting with different numbers of aggregation (read) and editorial (write) agents at c3.4xlarge and the local server, we made some interesting observations:</p>
+<ul>
+<li>There is almost no benefit in using more than 2 write agents. This can be explained by the fact that certain aspects of handling writes in GraphDB are serialized, i.e. they cannot be executed in parallel across multiple write threads;</li>
+<li>Using more read agents can have a negative impact on update performance. This is proven by the c3.4xlarge results with 8/2 and with 14/2 agents - while in the latter case GraphDB handles a somewhat higher number of queries (31 vs. 23), we see a drop in the update rates (from 21 to 17);</li>
+<li>Overall, the configuration with 8 read agents and 2 write agents delivers good, balanced results across various hardware configurations;</li>
+<li>For machines with more than 16 cores, a configuration like 10/2 or 14/2 would maximize the number of selects, still with good update rates. This way one can get 30 queries/sec. on c3.4xlarge and 40 queries/sec. on the local server;</li>
+<li>Launching more than 14 read agents does not help even on the local server with 32 logical cores. This indicates that at this point we are reaching some constraints, such as memory bandwidth or I/O throughput, on the degree of parallelization.</li>
+<li>There is some overhead in handling a bigger number of agents, as the local server tests with 14/3 and 20/2 show the worst results for both queries and updates.</li>
+</ul>
+<h3 id="efficiency-and-cost">Efficiency and Cost</h3>
+<p>AWS instance type c3.2xlarge provides the best price/performance ratio for applications where 15 updates/sec. are sufficient even at peak times. 
More intensive applications should use type c3.4xlarge, which guarantees more than 20 updates/sec.</p>
+<p>Cloud infrastructure providers like Amazon allow one to have a very clear account of the full cost for the server infrastructure, including hardware, hosting, electricity, network, etc.</p>
+<p>$1 spent on c3.2xlarge ($0.42/hour) allows for handling 140 000 queries, along with more than 120 000 update operations!</p>
+<p>The full cost of the server infrastructure is harder to compute in the case of purchasing a server and hosting it in a proprietary data center. Still, one can estimate the upper limits - for a machine like the local server used in this benchmark, this price is well below $1/hour. One should consider that this machine has 256GB of RAM, which is overkill for the Semantic Publishing Benchmark run at 50M scale. Under all these assumptions we see that using the local server is cheaper than the most cost-efficient AWS instance. This is expected - owning a car is always cheaper than renting it for 3 years in a row. Actually, the fact that the difference in price per query in this case is low indicates that using AWS services comes at a very low extra cost.</p>
+<p>To put these figures in the context of a known real-world application, let us model the case of a GraphDB Enterprise replication cluster with 2 master nodes and 6 worker nodes - the size of cluster that the BBC used for their FIFA World Cup 2010 project. Given the c3.2xlarge instance type, the math works as follows:</p>
+<ul>
+<li><strong>100 queries/sec.</strong> handled by the cluster. This means about 360 000 queries per hour or more than 4 million queries per day. This is at least 2 times more than the actual loads of GraphDB at the BBC during the peak times of big sports events.</li>
+<li><strong>10 updates/sec.</strong> - the speed of updates in a GraphDB Enterprise cluster is lower than the speed of each worker node in isolation. There are relatively few content management applications that need more than 36 000 updates per hour.</li>
+<li><strong>$81/day</strong> is the full cost for the server infrastructure (8 c3.2xlarge instances at $0.42/hour for 24 hours). This indicates an annual operational cost for a cluster of this type in the range of $30 000, even without any effort to release some of the worker nodes in non-peak times.</li>
+</ul>
+
+
+
+
+ DATAGEN: a Realistic Social Network Data Generator
+ https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/
+ Sat, 06 Dec 2014 00:00:00 +0000
+
+ https://ldbcouncil.org/post/datagen-a-realistic-social-network-data-generator/
+ <p>In previous posts (<a href="https://ldbcouncil.org/post/getting-started-with-snb">Getting started with snb</a>, <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">DATAGEN: data generation for the Social Network Benchmark</a>), Arnau Prat discussed the main features and characteristics of DATAGEN: <em>realism</em>, <em>scalability</em>, <em>determinism</em>, <em>usability</em>. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity of a social network site over a period of time. In this post, we conduct a series of experiments that will shed some light on how realistic the data produced by DATAGEN looks. 
For our testing, we generated a dataset of scale factor 10 (i.e., social network of 73K users during 3 years) and loaded it into Virtuoso by following the <a href="https://github.com/ldbc/ldbc_snb_datagen">instructions for generating a SNB dataset</a> and <a href="https://github.com/ldbc/ldbc_snb_implementations/tree/master/interactive/virtuoso">for loading the dataset into Virtuoso</a>. In the following sections, we analyze several aspects of the generated dataset.</p> +<h3 id="a-realistic-social-graph">A Realistic social graph</h3> +<p>One of the most complexly structured graphs that can be found in the data produced by DATAGEN is the friends graph, formed by people and their <em><knows></em> relationships. We used the R script after Figure 1 to draw the social degree distribution in the SNB friends graph. As shown in Figure 1, the cumulative social degree distribution of the friends graph is similar to that from Facebook (See the note about <a href="https://www.facebook.com/notes/facebook-data-team/anatomy-of-facebook/10150388519243859">Facebook Anatomy</a>). This is not by chance, as DATAGEN has been designed to deliberately reproduce the Facebook&rsquo;s graph distribution.</p> +<p><img src="Cumulative-distribution.png" alt="image"> <br> +Figure 1: Cumulative distribution #friends per user</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-r" data-lang="r"><span style="display:flex;"><span><span style="color:#75715e">#R script for generating the social degree distribution </span> +</span></span><span style="display:flex;"><span><span style="color:#75715e">#Input files: person_knows_person_*.csv</span> +</span></span><span style="display:flex;"><span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(data.table) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(igraph) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">library</span>(plotrix) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">require</span>(bit64) +</span></span><span style="display:flex;"><span>dflist <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">lapply</span>(<span style="color:#a6e22e">commandArgs</span>(trailingOnly <span style="color:#f92672">=</span> <span style="color:#66d9ef">TRUE</span>), fread, sep<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;|&#34;</span>, +</span></span><span style="display:flex;"><span> header<span style="color:#f92672">=</span>T, select<span style="color:#f92672">=</span><span style="color:#ae81ff">1</span><span style="color:#f92672">:</span><span style="color:#ae81ff">2</span>, colClasses<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;integer64&#34;</span>) +</span></span><span style="display:flex;"><span> df <span style="color:#f92672">&lt;-</span> <span style="color:#a6e22e">rbindlist</span>(dflist) <span style="color:#a6e22e">setNames</span>(df, <span style="color:#a6e22e">c</span>(<span style="color:#e6db74">&#34;P1&#34;</span>, <span style="color:#e6db74">&#34;P2&#34;</span>)) +</span></span><span style="display:flex;"><span>d2 <span style="color:#f92672">&lt;-</span> df[,<span style="color:#a6e22e">length</span>(P2),by<span style="color:#f92672">=</span>P1] +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">pdf</span>(<span 
style="color:#e6db74">&#34;socialdegreedist.pdf&#34;</span>) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">plot</span>(<span style="color:#a6e22e">ecdf</span>(d2<span style="color:#f92672">$</span>V1),main<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Cummulative distribution #friends per user&#34;</span>, +</span></span><span style="display:flex;"><span> xlab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Number of friends&#34;</span>, ylab<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;Percentage number of users&#34;</span>, log<span style="color:#f92672">=</span><span style="color:#e6db74">&#34;x&#34;</span>, +</span></span><span style="display:flex;"><span> xlim<span style="color:#f92672">=</span><span style="color:#a6e22e">c</span>(<span style="color:#ae81ff">0.8</span>, <span style="color:#a6e22e">max</span>(d2<span style="color:#f92672">$</span>V1) <span style="color:#f92672">+</span> <span style="color:#ae81ff">20</span>)) +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">dev.off</span>() +</span></span></code></pre></div><h3 id="data-correlations">Data Correlations</h3> +<p>Data in real life as well as in a real social network is correlated; e.g. names of people living in Germany have a different distribution than those living in Netherlands, people who went to the same university in the same period have a much higher probability to be friends and so on and so forth. In this experiment we will analyze if data produced by DATAGEN also reproduces these phenomena.</p> +<p><em>Which are the most popular names of a country?</em></p> +<p>We run the following query on the database built in Virtuoso, which computes the distribution of the names of the people for a given country. In this query, <em>&lsquo;A_country_name&rsquo;</em> is the name of a particular country such as <em>&lsquo;Germany&rsquo;, &lsquo;Netherlands&rsquo;, or &lsquo;Vietnam&rsquo;</em>.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> p_lastname, <span style="color:#66d9ef">count</span> (p_lastname) <span style="color:#66d9ef">as</span> namecnt +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">FROM</span> person, country +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> p_placeid <span style="color:#f92672">=</span> ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;A_country_name&#39;</span> +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> p_lastname <span style="color:#66d9ef">order</span> <span style="color:#66d9ef">by</span> namecnt <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we can see from Figures 2, 3, and 4, the distributions of names in Germany, Netherlands and Vietnam are different. A name that is popular in Germany such as <em>Muller</em> is not popular in the Netherlands, and it even does not appear in the names of people in Vietnam. 
We note that the names&rsquo; distribution may not be exactly the same as the contemporary names&rsquo; distribution in these countries, since the names resource files used in DATAGEN are extracted from Dbpedia, which may contain names from different periods of time.</p> +<p><img src="distribution-germany.png" alt="image"> <br> +Figure 2. Distribution of names in Germany</p> +<p><img src="distribution-netherlands.png" alt=""> <br> +Figure 3. Distribution of names in Netherlands</p> +<p><img src="distribution-vietnam.png" alt=""> <br> +Figure 4. Distribution of names in Vietnam</p> +<p><em>Where my friends are living?</em></p> +<p>We run the following query, which computes the locations of the friends of people living in China.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> fctry.ctry_name, <span style="color:#66d9ef">count</span> (<span style="color:#f92672">*</span>) <span style="color:#66d9ef">from</span> person <span style="color:#66d9ef">self</span>, person +</span></span><span style="display:flex;"><span>friend, country pctry, knows, country fctry +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> pctry.ctry_name <span style="color:#f92672">=</span> <span style="color:#e6db74">&#39;China&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> <span style="color:#66d9ef">self</span>.p_placeid <span style="color:#f92672">=</span> pctry.ctry_city +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> <span style="color:#66d9ef">self</span>.p_personid <span style="color:#66d9ef">and</span> friend.p_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> fctry.ctry_city <span style="color:#f92672">=</span> friend.p_placeid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> fctry.ctry_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As shown in the graph, most of the friends of people living in China are also living in China. The rest comes predominantly from near-by countries such as India, Vietnam.</p> +<p><img src="chinese-friends.png" alt=""> <br> +Figure 5. 
Locations of friends of people in China</p> +<p><em>Where my friends are studying?</em></p> +<p>Finally, we run the following query to find where the friends of people studying at a specific university (e.g., “Hangzhou_International_School”) are studying at.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-sql" data-lang="sql"><span style="display:flex;"><span><span style="color:#66d9ef">SELECT</span> top <span style="color:#ae81ff">10</span> o2.o_name, <span style="color:#66d9ef">count</span>(o2.o_name) <span style="color:#66d9ef">from</span> knows, person_university +</span></span><span style="display:flex;"><span>p1, person_university p2, organisation o1, organisation o2 +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">WHERE</span> +</span></span><span style="display:flex;"><span> p1.pu_organisationid <span style="color:#f92672">=</span> o1.o_organisationid +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> o1.o_name<span style="color:#f92672">=</span><span style="color:#e6db74">&#39;Hangzhou_International_School&#39;</span> +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> k_person1id <span style="color:#f92672">=</span> p1.pu_personid <span style="color:#66d9ef">and</span> p2.pu_personid <span style="color:#f92672">=</span> k_person2id +</span></span><span style="display:flex;"><span> <span style="color:#66d9ef">and</span> p2.pu_organisationid <span style="color:#f92672">=</span> o2.o_organisationid +</span></span><span style="display:flex;"><span><span style="color:#66d9ef">GROUP</span> <span style="color:#66d9ef">BY</span> o2.o_name <span style="color:#66d9ef">ORDER</span> <span style="color:#66d9ef">BY</span> <span style="color:#ae81ff">2</span> <span style="color:#66d9ef">desc</span>; +</span></span></code></pre></div><p>As we see from Figure 6, most of the friends of the Hangzhou International School students also study at that university. This is a realistic correlation, as people studying at the same university have a much higher probability to be friends. Furthermore, top-10 universities for the friends of the Hangzhou School students’ are from China, while people from foreign universities have small number of friends that study in Hangzhou School (See Table 1).</p> +<p><img src="friends-international-school.png" alt=""> <br> +Figure 6. Top-10 universities where the friends of Hangzhou International School students are studying at.</p> +<table> +<thead> +<tr> +<th>Name</th> +<th># of friends</th> +</tr> +</thead> +<tbody> +<tr> +<td>Hangzhou_International_School</td> +<td>12696</td> +</tr> +<tr> +<td>Anhui_University_of_Science_and_Technology</td> +<td>4071</td> +</tr> +<tr> +<td>China_Jiliang_University</td> +<td>3519</td> +</tr> +<tr> +<td>&hellip;</td> +<td></td> +</tr> +<tr> +<td>Darmstadt_University_of_Applied_Sciences</td> +<td>1</td> +</tr> +<tr> +<td>Calcutta_School_of_Tropical_Medicine</td> +<td>1</td> +</tr> +<tr> +<td>Chettinad_Vidyashram</td> +<td>1</td> +</tr> +<tr> +<td>Women&rsquo;s_College_Shillong</td> +<td>1</td> +</tr> +<tr> +<td>Universitas_Nasional</td> +<td>1</td> +</tr> +</tbody> +</table> +<p>Table 1. Universities where friends of Hangzhou International School students are studying at.</p> +<p>In a real social network, data is riddled with many more correlations; it is a true data mining task to extract these. 
Even though DATAGEN may not be able to model all the real life data correlations, it can generate a dataset that reproduce many of those important characteristics found in a real social network, and additionally introduce a series of plausible correlations in it. More and more interesting data correlations may also be found from playing with the SNB generated data.</p> + + + + + SNB Driver - Part 1 + https://ldbcouncil.org/post/snb-driver-part-1/ + Thu, 27 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-driver-part-1/ + <p>In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as driver). Software and documentation for this driver is available here: <a href="https://github.com/ldbc/ldbc_driver/">https://github.com/ldbc/ldbc_driver/</a>. Multiple reference implementations by two vendors are available here: <a href="https://github.com/ldbc/ldbc_snb_implementations">https://github.com/ldbc/ldbc_snb_implementations</a>, and discussion of the schema, data properties, and related content is available here: <a href="https://github.com/ldbc/ldbc_snb_docs">https://github.com/ldbc/ldbc_snb_docs</a>.</p> +<p>The following will concentrate on key decisions and techniques that were developed to support scalable, repeatable, distributed workload execution.</p> +<h3 id="problem-description">Problem Description</h3> +<p>The driver generates a stream of operations (e.g. create user, create post, create comment, retrieve person&rsquo;s posts etc.) and then executes them using the provided database connector. To be capable of generating heavier loads, it executes the operations from this stream in parallel. If there were no dependencies between operations (e.g., reads that depend on the completion of writes) this would be trivial. This is the case, for example, for the classical TPC-C benchmark, where splitting transaction stream into parallel clients (terminals) is trivial. However, for LDBC SNB Interactive Workload this is not the case: some operations within the stream do depend on others, others are depended on, some both depend on others and are depended on, and some neither depend on others nor are they depended on.</p> +<p>Consider, for example, a Social Network Benchmark scenario, where the data generator outputs a sequence of events such as User A posted a picture, User B left a comment to the picture of User A, etc. The second event depends on the first one in a sense that there is a causal ordering between them: User B can only leave a comment on the picture once it has been posted. The generated events are already ordered by their time stamp, so in case of the single-threaded execution this ordering is observed by default: the driver issues a request to the SUT with the first event (i.e., User A posts a picture), after its completion it issues the second event (create a comment). However, if events are executed in parallel, these two events may end up in different parallel sequences of events. 
Therefore, a driver needs a mechanism to ensure the dependency is observed even when the dependent events are in different parallel update streams.</p> +<p>The next blog entries in this series will discuss the approaches used in the driver to deal with these challenges.</p> + + + + + Making Semantic Publishing Execution Rules + https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/ + Tue, 18 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-semantic-publishing-execution-rules/ + <p><a href="https://ldbcouncil.org/">LDBC</a> <a href="https://ldbcouncil.org/benchmarks/spb">SPB (Semantic Publishing Benchmark)</a> is based on the BBC linked data platform use case. Thus the data modelling and transaction mix reflects the BBC&rsquo;s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an <a href="https://www.ontotext.com/products/ontotext-graphdb-owlim/">Ontotext Graph DB</a> deployment. Graph DB was formerly known as Owlim.</p> +<p>So, in SPB we wanted to address substantially more complex queries than the lookups that the BBC linked data platform primarily serves. Diverse dataset summaries, timelines and faceted search qualified by keywords and/or geography are examples of online user experience that SPB needs to cover.</p> +<p>SPB is not per se an analytical workload but we still find that the queries fall broadly in two categories:</p> +<ul> +<li> +<p>Some queries are centred on a particular search or entity. The data touched by the query size does not grow at the same rate as the dataset.</p> +</li> +<li> +<p>Some queries cover whole cross sections of the dataset, e.g. find the most popular tags across the whole database.</p> +</li> +</ul> +<p>These different classes of questions need to be separated in a metric, otherwise the short lookup dominates at small scales and the large query at large scales.</p> +<p>Another guiding factor of SPB was the BBC&rsquo;s and others&rsquo; express wish to cover operational aspects such as online backups, replication and fail-over in a benchmark. True, most online installations have to deal with these things, which are yet as good as absent from present benchmark practice. We will look at these aspects in a different article, for now, I will just discuss the matter of workload mix and metric.</p> +<p>Normally the lookup and analytics workloads are divided into different benchmarks. Here we will try something different. There are three things the benchmark does:</p> +<ul> +<li> +<p>Updates - These sometimes insert a graph, sometimes delete and re-insert the same graph, sometimes just delete a graph. These are logarithmic to data size.</p> +</li> +<li> +<p>Short queries - These are lookups that most often touch on recent data and can drive page impressions. These are roughly logarithmic to data scale.</p> +</li> +<li> +<p>Analytics - These cover a large fraction of the dataset and are roughly linear to data size.</p> +</li> +</ul> +<p>A test sponsor can decide on the query mix within certain bounds. A qualifying run must sustain a minimum, scale-dependent update throughput and must execute a scale-dependent number of analytical query mixes or run for a scale-dependent duration. The minimum update rate, the minimum number of analytics mixes and the minimum duration all grow logarithmically to data size. Within these limits, the test sponsor can decide how to mix the workloads. Publishing several results, emphasizing different aspects is also possible. 
A given system may be specially good at one aspect, leading the test sponsor to accentuate this.</p> +<p>The benchmark has been developed and tested at small scales, between 50 and 150M triples. Next we need to see how it actually scales. There we expect to see how the two query sets behave differently. One effect that we see right away when loading data is that creating the full text index on the literals is in fact the longest running part. For a SF 32 ( 1.6 billion triples) SPB database we have the following space consumption figures:</p> +<ul> +<li> +<p>46886 MB of RDF literal text</p> +</li> +<li> +<p>23924 MB of full text index for RDF literals</p> +</li> +<li> +<p>23598 MB of URI strings</p> +</li> +<li> +<p>21981 MB of quads, stored column-wise with default index scheme</p> +</li> +</ul> +<p>Clearly, applying column-wise compression to the strings is the best move for increasing scalability. The literals are individually short, so literal per literal compression will do little or nothing but applying this by the column is known to get a 2x size reduction with Google Snappy. The full text index does not get much from column store techniques, as it already consists of words followed by space efficient lists of word positions. The above numbers are measured with Virtuoso column store, with quads column wise and the rest row-wise. Each number includes the table(s) and any extra indices associated to them.</p> +<p>Let&rsquo;s now look at a full run at unit scale, i.e. 50M triples.</p> +<p>The run rules stipulate a minimum of 7 updates per second. The updates are comparatively fast, so we set the update rate to 70 updates per second. This is seen not to take too much CPU. We run 2 threads of updates, 20 of short queries and 2 of long queries. The minimum run time for the unit scale is 10 minutes, so we do 10 analytical mixes, as this is expected to take 10 a little over 10 minutes. The run stops by itself when the last of the analytical mixes finishes.</p> +<p>The interactive driver reports:</p> +<pre tabindex="0"><code>Seconds run : 2144 + Editorial: + 2 agents + + 68164 inserts (avg : 46 ms, min : 5 ms, max : 3002 ms) + 8440 updates (avg : 72 ms, min : 15 ms, max : 2471 ms) + 8539 deletes (avg : 37 ms, min : 4 ms, max : 2531 ms) + + 85143 operations (68164 CW Inserts (98 errors), 8440 CW Updates (0 errors), 8539 CW Deletions (0 errors)) + 39.7122 average operations per second + + Aggregation: + 20 agents + + 4120 Q1 queries (avg : 789 ms, min : 197 ms, max : 6767 ms, 0 errors) + 4121 Q2 queries (avg : 85 ms, min : 26 ms, max : 3058 ms, 0 errors) + 4124 Q3 queries (avg : 67 ms, min : 5 ms, max : 3031 ms, 0 errors) + 4118 Q5 queries (avg : 354 ms, min : 3 ms, max : 8172 ms, 0 errors) + 4117 Q8 queries (avg : 975 ms, min : 25 ms, max : 7368 ms, 0 errors) + 4119 Q11 queries (avg : 221 ms, min : 75 ms, max : 3129 ms, 0 errors) + 4122 Q12 queries (avg : 131 ms, min : 45 ms, max : 1130 ms, 0 errors) + 4115 Q17 queries (avg : 5321 ms, min : 35 ms, max : 13144 ms, 0 errors) + 4119 Q18 queries (avg : 987 ms, min : 138 ms, max : 6738 ms, 0 errors) + 4121 Q24 queries (avg : 917 ms, min : 33 ms, max : 3653 ms, 0 errors) + 4122 Q25 queries (avg : 451 ms, min : 70 ms, max : 3695 ms, 0 errors) + + 22.5239 average queries per second. 
Pool 0, queries [ Q1 Q2 Q3 Q5 Q8 Q11 Q12 Q17 Q18 Q24 Q25 ] + + 45318 total retrieval queries (0 timed-out) + 22.5239 average queries per second +</code></pre><p>The analytical driver reports:</p> +<pre tabindex="0"><code>Aggregation: + 2 agents + + 14 Q4 queries (avg : 9984 ms, min : 4832 ms, max : 17957 ms, 0 errors) + 12 Q6 queries (avg : 4173 ms, min : 46 ms, max : 7843 ms, 0 errors) + 13 Q7 queries (avg : 1855 ms, min : 1295 ms, max : 2415 ms, 0 errors) + 13 Q9 queries (avg : 561 ms, min : 446 ms, max : 662 ms, 0 errors) + 14 Q10 queries (avg : 2641 ms, min : 1652 ms, max : 4238 ms, 0 errors) + 12 Q13 queries (avg : 595 ms, min : 373 ms, max : 1167 ms, 0 errors) + 12 Q14 queries (avg : 65362 ms, min : 6127 ms, max : 136346 ms, 2 errors) + 13 Q15 queries (avg : 45737 ms, min : 12698 ms, max : 59935 ms, 0 errors) + 13 Q16 queries (avg : 30939 ms, min : 10224 ms, max : 38161 ms, 0 errors) + 13 Q19 queries (avg : 310 ms, min : 26 ms, max : 1733 ms, 0 errors) + 12 Q20 queries (avg : 13821 ms, min : 11092 ms, max : 15435 ms, 0 errors) + 13 Q21 queries (avg : 36611 ms, min : 14164 ms, max : 70954 ms, 0 errors) + 13 Q22 queries (avg : 42048 ms, min : 7106 ms, max : 74296 ms, 0 errors) + 13 Q23 queries (avg : 48474 ms, min : 18574 ms, max : 93656 ms, 0 errors) + 0.0862 average queries per second. Pool 0, queries [ Q4 Q6 Q7 Q9 Q10 Q13 Q14 Q15 Q16 Q19 Q20 Q21 Q22 Q23 ] + + 180 total retrieval queries (2 timed-out) + 0.0862 average queries per second +</code></pre><p>The metric would be 22.52 qi/s, 310 qa/h, 39.7 u/s @ 50Mt (SF 1)</p> +<p>The SUT is dual Xeon E5-2630, all in memory. The platform utilization is steadily above 2000% CPU (over 20/24 hardware threads busy on the DBMS). The DBMS is Virtuoso open source, (<a href="https://github.com/v7fasttrack/virtuoso-opensource/">v7fasttrack at github.com</a>, <a href="https://github.com/v7fasttrack/virtuoso-opensource/tree/feature/analytics">feature/analytics</a>).</p> +<p>The minimum update rate of 7/s was sustained but fell short of the target of 70./s. In this run, most demand was put on the interactive queries. Different thread allocations would give different ratios of the metric components. The analytics mix is for example about 3x faster without other concurrent activity.</p> +<p>Is this good or bad? I would say that this is possible but better can certainly be accomplished.</p> +<p>The initial observation is that Q17 is the worst of the interactive lot. 3x better is easily accomplished by avoiding a basic stupidity. The query does the evil deed of checking for a substring in a URI. This is done in the wrong place and accounts for most of the time. The query is meant to test geo retrieval but ends up doing something quite different. Optimizing this right would almost double the interactive score. There are some timeouts in the analytical run, which as such disqualifies the run. This is not a fully compliant result but is close enough to give an idea of the dynamics. So we see that the experiment is definitely feasible, is reasonably defined and that the dynamics seen make sense.</p> +<p>As an initial comment of the workload mix, I&rsquo;d say that interactive should have a few more very short point lookups to stress compilation times and give a higher absolute score of queries per second.</p> +<p>Adjustments to the mix will depend on what we find out about scaling. 
As with SNB, it is likely that the workload will shift a little, so this result might not be comparable with future ones.</p> +<p>In the next SPB article, we will look closer at performance dynamics and choke points and will have an initial impression on scaling the workload.</p> + + + + + Fifth TUC Meeting + https://ldbcouncil.org/event/fifth-tuc-meeting/ + Fri, 14 Nov 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fifth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce its fifth Technical User<br> +Community (TUC) meeting.</p> +<p>This will be a one-day event at the National Hellenic Research Institute<br> +in Athens, Greece on <strong>Friday November 14, 2014</strong>.</p> +<h3 id="agenda">Agenda</h3> +<p>10:30 - 11:00 Coffee Break</p> +<p>11:00 - 11:10 Peter Boncz (VUA) Welcome &amp; LDBC project status update (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979841.pptx">Presentation</a>)</p> +<p>11:10 - 11:25 Venelin Kotsev (ONTO) Semantic Publishing Benchmark:Short Presentation of SPB and Status</p> +<p>Feedback &amp; Roadmap for SPB &amp; OWLIM (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979839.pdf">Presentation</a>)</p> +<p>11:25 - 11:30 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SPB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979828.pdf">Presentation</a>)</p> +<p>11:30 - 11:45 Alex Averbuch (NEO) Social Network Benchmark: Short Presentation of SNB and Status, Feedback &amp; Roadmap for SNB &amp; Neo4J (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979830.pdf">Presentation</a>)</p> +<p>11:45 - 12:00 Orri Erling (OGL) Status, Feedback &amp; Roadmap for SNB &amp; Virtuoso (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979829.pdf">Presentation</a>)</p> +<p>12:00 - 12:20 Arnau Prat (UPC) &amp; Andrey Gubichev Status, Feedback &amp; Roadmap for SNB Interactive &amp; Sparksee (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979836.pdf">Presentation</a> ) and Business Intelligence (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979837.pdf">Presentation</a>)</p> +<p>12:20 - 12:40 Tomer Sagi, &ldquo;Experience with SNB and TitanDB at HP&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979838.pptx">Presentation</a> )</p> +<p>12:40 - 13:00 Jakob Nelson, &ldquo;graphbench.org on the SNB datagen&rdquo;</p> +<p>13:00 - 14:30 Lunch Break@Byzantine &amp; Christian Museum (<a href="http://www.byzantinemuseum.gr/en/">link</a>)</p> +<p>14:30 - 14:50 Olaf Hartig, &ldquo;Integrating the Property Graph and RDF data models&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979831.pdf">Presentation</a>)\</p> +<p>Documents: <a href="http://arxiv.org/abs/1409.3288">arxiv/1409.3288</a>, <a href="http://arxiv.org/abs/1406.3399">arxiv/1406.3399</a></p> +<p>14:50 - 15:10 Maria-Esther Vidal and Maribel Acosta, &ldquo;Challenges to be addressed during Benchmarking SPARQL Federated Engines&rdquo; (<a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979842.pdf">Presentation</a>)</p> +<p>15:10 - 15:30 Evaggelia Pitoura, &ldquo;Historical Queries on Graphs&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979835.pdf">Presentation</a>)</p> +<p>15:30 - 16:00 Coffee Break</p> +<p>16:00 - 16:20 Manolis Terrovitis, Giannis Liagos, George Papastefanatos, &ldquo;Efficient Identification of Implicit Facts in Incomplete OWL2-EL Knowledge Bases&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979843.pdf">Presentation</a>)</p> +<p>16:20 - 16:40 Gunes Aluc, &ldquo;WatDiv: How to Tune-up your RDF Data Management System&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979832.pdf">Presentation</a>)</p> +<p>16:40 - 17:00 Giorgos Kollias, Yannis Smaragdakis, &ldquo;Benchmarking @LogicBlox&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979840.pdf">Presentation</a>)</p> +<p>17:00 - 17:15 Hassan Chafi, &ldquo;Oracle Labs Graph Strategy&rdquo;</p> +<p>17:15 - 17:25 Yinglong Xia, &ldquo;Property Graphs for Industry Solution at IBM&rdquo; (<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/6979834.pdf">Presentation</a>)</p> +<p>17:25 - 17:30 Arthur Keen, &ldquo;Short Introduction to SPARQLcity&rdquo;</p> +<p><em><strong>20:30 Dinner @ Konservokouti <a href="https://plus.google.com/114240752029716758955/about?gl=gr&amp;hl=en">(link)</a></strong></em></p> +<p><em><strong>Get a Taxi, and go to Ippokratous 148, Athens, Neapoli Exarheion</strong></em></p> +<h4 id="logistics">Logistics</h4> +<p>The meeting will be held at the <a href="http://www.eie.gr/index-en.html">National Hellenic Research Foundation</a> located in <a href="http://www.eie.gr/location-en.html">downtown Athens</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fifth-tuc-meeting/attachments/5996808/5964344.gif" alt=""></p> +<h4 id="travel">Travel</h4> +<p>Athens, Greece&rsquo;s capital city, is easily accessible by air. Travelers on flights to Athens will land at Athens Eleftherios Venizelos International Airport.</p> +<p>To arrive in the city center, you can take the metro from the airport (Line #3) and stop at either stop Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations. You can also take express Bus X95 and stop again at either Evangelismos (ΕΥΑΓΓΕΛΙΣΜΟΣ) or at Syntagma (ΣΥΝΤΑΓΜΑ) stations (the latter is the terminus for the bus).</p> +<p>You can also take a taxi from the airport that runs on a fixed price for the city center (45 euros). More information on how to move around in Athens from the airport can be found here: <a href="http://www.aia.gr/traveler/">http://www.aia.gr/traveler/</a></p> + + + + + Getting Started With the Semantic Publishing Benchmark + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + Sun, 09 Nov 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-the-semantic-publishing-benchmark/ + <p>The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. 
It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies proposed by BBC that define numerous properties for content; they contain all RDFS schema constructs and certain OWL ones.</p> +<p>The benchmark proposes a data generator that uses the ontologies provided by BBC and reference datasets (again provided by BBC) to produce a set of valid instances; it works with a predefined set of distributions derived from the reference datasets. In addition to these distributions, the data generator also models:</p> +<ul> +<li>clustering of creative works around certain entities from the reference datasets (e.g. the association of an entity with creative works would decay exponentially in time)</li> +<li>correlations between entities - there will be creative works about two entities for a certain period in time, that way a history of interactions is also modelled (e.g. J. Biden and B. Obama are tagged in creative works for a continuous period in time)</li> +</ul> +<p>The driver proposed by the benchmark measures the performance of CRUD operations of a SPARQL endpoint by starting a number of concurrently running editorial and aggregation agents. The former executes a series of insert, update and delete operations, whereas the latter executes a set of construct, describe, and select queries on a SPARQL endpoint. The benchmark can access all SPARQL endpoints that support the SPARQL 1.1 protocol. Tests have been run on OWLIM and Virtuoso. Attempts were also made with Stardog.</p> +<p>Currently, the benchmark offers two workloads: a base version that consists of a mix of nine queries of different complexity that consider nearly all the features of the SPARQL 1.1 query language including sorting, subqueries, limit, regular expressions and grouping.
The queries aim at checking different choke points relevant to query optimisation such as:</p> +<ul> +<li>join ordering based on cardinality constraints - expressed by the different kinds of properties defined in the schema</li> +<li>subselects that aggregate the query results that the optimiser should recognise and evaluate first</li> +<li>optional and nested optional clauses where the optimiser is called to produce a plan where the execution of the optional triple patterns is performed last</li> +<li>reasoning along the RDFS constructs (subclass, subproperty hierarchies, functional, object and transitive properties etc.)</li> +<li>unions to be executed in parallel</li> +<li>optionals that contain filter expressions that should be executed as early as possible in order to eliminate intermediate results</li> +<li>ordering where the optimiser could consider the possibility to choose query plan(s) that facilitate the ordering of results</li> +<li>handling of geo-spatial predicates</li> +<li>full-text search optimisation</li> +<li>asynchronous execution of the aggregate sub-queries</li> +<li>use of distinct to choose the optimal query plan</li> +</ul> +<p>We give below Query 1 of the Semantic Publishing Benchmark.</p> +<pre tabindex="0"><code>PREFIX bbcevent:&lt;http://www.bbc.co.uk/ontologies/event/&gt; +PREFIX geo-pos:&lt;http://www.w3.org/2003/01/geo/wgs84_pos#&gt; +PREFIX bbc:&lt;http://www.bbc.co.uk/ontologies/bbc/&gt; +PREFIX time:&lt;http://www.w3.org/2006/time#&gt; +PREFIX event:&lt;http://purl.org/NET/c4dm/event.owl#&gt; +PREFIX music-ont:&lt;http://purl.org/ontology/mo/&gt; +PREFIX rdf:&lt;http://www.w3.org/1999/02/22-rdf-syntax-ns#&gt; +PREFIX foaf:&lt;http://xmlns.com/foaf/0.1/&gt; +PREFIX provenance:&lt;http://www.bbc.co.uk/ontologies/provenance/&gt; +PREFIX owl:&lt;http://www.w3.org/2002/07/owl#&gt; +PREFIX cms:&lt;http://www.bbc.co.uk/ontologies/cms/&gt; +PREFIX news:&lt;http://www.bbc.co.uk/ontologies/news/&gt; +PREFIX cnews:&lt;http://www.bbc.co.uk/ontologies/news/cnews/&gt; +PREFIX cconcepts:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX dbp-prop:&lt;http://dbpedia.org/property/&gt; +PREFIX geonames:&lt;http://sws.geonames.org/&gt; +PREFIX rdfs:&lt;http://www.w3.org/2000/01/rdf-schema#&gt; +PREFIX domain:&lt;http://www.bbc.co.uk/ontologies/domain/&gt; +PREFIX dbpedia:&lt;http://dbpedia.org/resource/&gt; +PREFIX geo-ont:&lt;http://www.geonames.org/ontology#&gt; +PREFIX bbc-pont:&lt;http://purl.org/ontology/po/&gt; +PREFIX tagging:&lt;http://www.bbc.co.uk/ontologies/tagging/&gt; +PREFIX sport:&lt;http://www.bbc.co.uk/ontologies/sport/&gt; +PREFIX skosCore:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX dbp-ont:&lt;http://dbpedia.org/ontology/&gt; +PREFIX xsd:&lt;http://www.w3.org/2001/XMLSchema#&gt; +PREFIX core:&lt;http://www.bbc.co.uk/ontologies/coreconcepts/&gt; +PREFIX curric:&lt;http://www.bbc.co.uk/ontologies/curriculum/&gt; +PREFIX skos:&lt;http://www.w3.org/2004/02/skos/core#&gt; +PREFIX cwork:&lt;http://www.bbc.co.uk/ontologies/creativework/&gt; +PREFIX fb:&lt;http://rdf.freebase.com/ns/&gt; + +# Query Name : query1 +# Query Description : +# Retrieve creative works about thing t (or that mention t) +# reasoning: rdfs:subClassOf, rdf:type +# join ordering: cwork:dateModified rdf:type owl:FunctionalProperty +# join ordering: cwork:dateCreated rdf:type owl:FunctionalProperty +# Choke Points : +# - join ordering based on cardinality of functional proerties cwork:dateCreated, cwork:dateModified +# Optimizer should use an efficient cost evaluation method 
for choosing the optimal join tree +# - A sub-select which aggregates results. Optimizer should recognize it and execute it first +# - OPTIONAL and nested OPTIONAL clauses (treated by query optimizer as nested sub-queries) +# Optimizer should decide to put optional triples on top of the join tree +# (i.e. delay their execution to the last possible moment) because OPTIONALs are treated as a left join +# - qiery optimizer has the chance to recognize the triple pattern : ?cWork a ?type . ?type rdfs:subClassOf cwork:CreativeWork +# and eliminate first triple (?cwork a ?type .) since ?cwork is a cwork:CreativeWork​ + +CONSTRUCT { + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:shortTitle ?shortTitle ; + cwork:about ?about ; + cwork:mentions ?mentions ; + cwork:dateCreated ?created ; + cwork:dateModified ?modified ; + cwork:description ?description ; + cwork:primaryFormat ?primaryFormat ; + bbc:primaryContentOf ?webDocument . + ?webDocument bbc:webDocumentType ?webDocType . + ?about rdfs:label ?aboutLabel ; + bbc:shortLabel ?aboutShortLabel ; + bbc:preferredLabel ?aboutPreferredLabel . + ?mentions rdfs:label ?mentionsLabel ; + bbc:shortLabel ?mentionsShortLabel ; + bbc:preferredLabel ?mentionsPreferredLabel . + ?creativeWork cwork:thumbnail ?thumbnail . + ?thumbnail a cwork:Thumbnail ; + cwork:altText ?thumbnailAltText ; + cwork:thumbnailType ?thumbnailType . +} +WHERE { + { + SELECT ?creativeWork + WHERE { + ?creativeWork {{{cwAboutOrMentions}}} {{{cwAboutOrMentionsUri}}} . + ?creativeWork a cwork:CreativeWork ; + cwork:dateModified ?modified . + } + ORDER BY DESC(?modified) + LIMIT 10 + } + ?creativeWork a cwork:CreativeWork ; + a ?type ; + cwork:title ?title ; + cwork:dateModified ?modified . + OPTIONAL { ?creativeWork cwork:shortTitle ?shortTitle . } + OPTIONAL { ?creativeWork cwork:description ?description . } + OPTIONAL { ?creativeWork cwork:about ?about . + OPTIONAL { ?about rdfs:label ?aboutLabel . } + OPTIONAL { ?about bbc:shortLabel ?aboutShortLabel . } + OPTIONAL { ?about bbc:preferredLabel ?aboutPreferredLabel . } + } + OPTIONAL { + ?creativeWork cwork:mentions ?mentions . + OPTIONAL { ?mentions rdfs:label ?mentionsLabel . } + OPTIONAL { ?mentions bbc:shortLabel ?mentionsShortLabel . } + OPTIONAL { ?mentions bbc:preferredLabel ?mentionsPreferredLabel . } + } + OPTIONAL { ?creativeWork cwork:dateCreated ?created . } + OPTIONAL { ?creativeWork cwork:primaryFormat ?primaryFormat . } + OPTIONAL { ?webDocument bbc:primaryContent ?creativeWork . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork bbc:primaryContentOf ?webDocument . + OPTIONAL { ?webDocument bbc:webDocumentType ?webDocType . } + } + OPTIONAL { ?creativeWork cwork:thumbnail ?thumbnail . + OPTIONAL { ?thumbnail cwork:altText ?thumbnailAltText . } + OPTIONAL { ?thumbnail cwork:thumbnailType ?thumbnailType . } + } +} +</code></pre><p>Listing 1. Semantic Publishing Benchmark: Query 1</p> +<p>The benchmark test driver is distributed as a jar file, but can also be built using an ant script. It is distributed with the BBC ontologies and reference datasets, the queries and update workloads discussed earlier and the configuration parameters for running the benchmark and for generating the data. 
It is organised in the following different phases: ontology loading and reference dataset loading, dataset generation and loading, warm up (where a series of aggregation queries are run for a predefined amount of time), benchmark (where all queries, aggregation and editorial, are run), conformance checking (that allows one to check whether the employed RDF engine implements OWL reasoning) and finally cleanup, which removes all the data from the repository. The benchmark provides a certain degree of freedom where each phase can run independently of the others.</p> +<p>The data generator uses an RDF repository to load ontologies and reference datasets; actually, any system that will be benchmarked should have those ontologies loaded. Any repository that will be used for the data generation should be set up with context indexing, and with geo-spatial indexing, if available, to serve the spatial queries. The current version of the benchmark has been tested with Virtuoso and OWLIM.</p> +<p>The generator uses configuration files that must be set appropriately to define the dataset size to produce, the number of aggregation and editorial agents, the query timeout, etc. The distributions used by the data generator could also be edited. The benchmark is very simple to run (once the RDF repository used to store the ontologies and the reference datasets is set up, and the configuration files updated appropriately) using the command: java -jar semantic_publishing_benchmark-*.jar test.properties. The benchmark produces three kinds of files that contain (a) brief information about each executed query, the size of the returned result, and the execution time (semantic_publishing_benchmark_queries_brief.log), (b) the detailed log of each executed query and its result (semantic_publishing_benchmark_queries_detailed.log) and (c) the benchmark results (semantic_publishing_benchmark_results.log).</p> +<p>Below we give an example of a run of the benchmark for OWLIM-SE. The benchmark reports the number of edit operations (inserts, updates, and deletes) and queries executed at the Nth second of a benchmark run. It also reports the total number of retrieval queries as well as the average number of queries executed per second.</p> +<pre tabindex="0"><code>Seconds run : 600 + Editorial: + 0 agents + + 0 operations (0 CW Inserts, 0 CW Updates, 0 CW Deletions) + 0.0000 average operations per second + + Aggregation: + 8 agents + + 298 Q1 queries + 267 Q2 queries + 243 Q3 queries + 291 Q4 queries + 320 Q5 queries + 286 Q6 queries + 255 Q7 queries + 274 Q8 queries + 271 Q9 queries + + 2505 total retrieval queries + 4.1750 average queries per second +</code></pre><p>Listing 2. A snippet of semantic_publishing_benchmark_results.log</p> +<p>We run the benchmark under the following configuration: we used 8 aggregation agents for query execution and 4 data generator workers all running in parallel. The warm up period is 120 seconds during which a number of aggregation agents are run to prepare the tested systems for query execution. Aggregation agents run for a period of 600 seconds, and queries time out after 90 seconds. We used 10 sets of substitution parameters for each query. For data generation, ontologies and reference datasets are loaded in the OWLIM-SE repository. We used OWLIM-SE, Version 5.4.6287 with Sesame Version 2.6 and Tomcat Version 6.
The results we obtained for the 10M, 100M and 1B triple datasets are given in the table below:</p> +<table> +<thead> +<tr> +<th>#triples</th> +<th>Q1</th> +<th>Q2</th> +<th>Q3</th> +<th>Q4</th> +<th>Q5</th> +<th>Q6</th> +<th>Q7</th> +<th>Q8</th> +<th>Q9</th> +<th>#queries</th> +<th>avg. #q. per sec.</th> +</tr> +</thead> +<tbody> +<tr> +<td>10M</td> +<td>298</td> +<td>267</td> +<td>243</td> +<td>291</td> +<td>320</td> +<td>286</td> +<td>255</td> +<td>274</td> +<td>271</td> +<td>2505</td> +<td>4.1750</td> +</tr> +<tr> +<td>100M</td> +<td>53</td> +<td>62</td> +<td>51</td> +<td>52</td> +<td>44</td> +<td>62</td> +<td>25</td> +<td>55</td> +<td>45</td> +<td>449</td> +<td>0.7483</td> +</tr> +<tr> +<td>1B</td> +<td>34</td> +<td>29</td> +<td>22</td> +<td>24</td> +<td>25</td> +<td>29</td> +<td>0</td> +<td>29</td> +<td>28</td> +<td>220</td> +<td>0.3667</td> +</tr> +</tbody> +</table> + + + + + Choke Point Based Benchmark Design + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/choke-point-based-benchmark-design/ + <p>The <em>Linked Data Benchmark Council</em>&rsquo;s (LDBC) mission is to design and maintain benchmarks for graph data management systems, to establish and enforce standards in running these benchmarks, and to publish and arbitrate around the official benchmark results. The council and its <a href="https://ldbcouncil.org">https://ldbcouncil.org</a> website just launched, and in its first 1.5 years of existence, most effort at LDBC has gone into investigating the needs of the field through interaction with the LDBC Technical User Community (<a href="https://ldbcouncil.org/event/fifth-tuc-meeting">next TUC meeting</a> will be on October 5 in Athens) and indeed in <em>designing benchmarks</em>.</p> +<p>So, what makes a good benchmark design? Many talented people have paved our way in addressing this question, and for relational database systems specifically, the benchmarks produced by <a href="http://www.tpc.org/">TPC</a> have been very helpful in maturing relational database technology, and making it successful. Good benchmarks are <em>relevant</em> and <em>representative</em> (address important challenges encountered in practice), <em>understandable</em>, <em>economical</em> (implementable on simple hardware), <em>fair</em> (such as not to favor a particular product or approach), <em>scalable</em>, <em>accepted</em> by the community and <em>public</em> (e.g. all of its software is available in open source). This list stems from Jim Gray&rsquo;s <a href="http://research.microsoft.com/en-us/um/people/gray/BenchmarkHandbook/TOC.htm">Benchmark Handbook</a>. In this blogpost, I will share some thoughts on each of these aspects of good benchmark design.</p> +<p>A very important aspect of benchmark development is making sure that the community <em>accepts</em> a certain benchmark, and starts using it. A benchmark without published results, and therefore without the opportunity to compare results, remains irrelevant. A European FP7 project is a good place to start gathering a critical mass of support (and consensus, in the process) for a new benchmark from the core group of benchmark designers in the joint work performed by the consortium. Since in LDBC multiple commercial graph and RDF vendors are on the table (Neo Technologies, Openlink, Ontotext and Sparsity), a minimal consensus on <strong>fairness</strong> had to be established immediately.
The Linked Data Benchmark Council itself is a noncommercial, neutral entity which releases all its benchmark specifications and software, as well as many materials created during the design. LDBC has spent a lot of time engaging interested parties (mainly through its <a href="https://ldbcouncil.org/tags/tuc-meeting/">Technical User Community gatherings</a>) as well as lining up additional organizations as members of the Linked Data Benchmark Council. There is, in other words, a strong non-technical, human factor in getting benchmarks accepted.</p> +<p>The need for <em>understandability</em> for me means that a database benchmark should consist of a limited number of queries and result metrics. Hence I find TPC-H with its 22 queries more understandable than TPC-DS with its 99, because after (quite some) study and experience it is possible to understand the underlying challenges of all queries in TPC-H. It may also be possible for TPC-DS but the amount of effort is just much larger. Understandability also means for me that a particular query should behave similarly, regardless of the query parameters. Often, a particular query needs to be executed many times, and in order not to play into the hands of simple query caching and also to enlarge the access footprint of the workload, different query parameters should be used. However, parameters can strongly change the nature of a query, and this is not desirable for the understandability of the workload. For instance, we know that TPC-H Q01 tests raw computation power, as its selection predicate eliminates almost nothing from the main fact table (LINEITEM), which it scans and aggregates into a small 4-tuple result. Using a selection parameter that would select only 0.1% of the data instead would seriously change the nature of Q01, e.g. making it amenable to indexing. This stability of parameter bindings is an interesting challenge for the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) of LDBC, which is not as uniform and uncorrelated as TPC-H. Addressing the challenge of obtaining parameter bindings that have similar execution characteristics will be the topic of a future blog post.</p> +<p>The <em>economical</em> aspect of benchmarking means that while rewarding high-end benchmark runs with higher scores, it is valuable if a meaningful run can also be done with small hardware. For this reason, it is good practice to use a performance-per-EURO (or $) metric, so that small installations, despite a lower absolute score, can still do well on that metric. The economical aspect is right now hurting the (still) leading relational OLTP benchmark TPC-C. Its implementation rules are such that for higher reported rates of throughput, a higher number of warehouses (i.e. larger data size) is needed. In the current day and age of JIT-compiled machine-code SQL procedures and CPU-cache optimized main memory databases, the OLTP throughput numbers now obtainable on modern transactional systems like Hyper on even a single server (it reaches more than 100,000 transactions per second) are so high that they lead to petabyte storage requirements. Not only does this make TPC-C very expensive to run, just by the sheer amount of hardware needed according to the rules, but it also undermines its representativity, since OLTP data sizes encountered in the field are much smaller than OLAP data sizes and do not run in the petabytes.</p> +<p><em>Representative</em> benchmarks can be designed by studying or even directly using real workload information, e.g.
query logs. A rigorous example of this is the <a href="http://aksw.org/Projects/DBPSB.html">DBpedia benchmark</a> whose workload is based on the query logs of dbpedia.org. However, this SPARQL endpoint is a single public Virtuoso instance that has been configured to interrupt all long running queries, such as to ensure the service remains responsive to as many users as possible. As a result, it is only practical to run small lookup queries on this database service, so the query log only contained solely such light queries. As a consequence, the DBpedia benchmark only tests small SPARQL queries that stress simple B-tree lookups only (and not joins, aggregations, path expressions or inference) and poses almost no technical challenges for either query optimization or execution. The lesson, thus, is to balance representativity with relevance (see later).</p> +<p>The fact that a benchmark can be <em>scaled</em> in size favors the use of synthetic data (i.e. created by a data generator) because data generators can produce any desired quantity of data. I hereby note that in this day and age, data generators should be parallel. Single-threaded single-machine data generation just becomes unbearable even at terabyte scales. A criticism of synthetic data is that it may not be representative of real data, which e.g. tends to contain highly correlated data with skewed distributions. This may be addressed to a certain extent by injecting specific skew and correlations into synthetic data as well (but: which skew and which correlations?). An alternative is to use real data and somehow blow up or contract the data. This is the approach in the mentioned DBpedia benchmark, though such scaling will distort the original distributions and correlations. Scaling a benchmark is very useful to investigate the effect of data size on the metric, on individual queries, or even in micro-benchmark tests that are not part of the official query set. Typically OLTP database benchmarks have queries whose complexity is O(log(N)) of the data size N, whereas OLAP benchmarks have queries which are linear, O(N) or at most O(N.log(N)) &ndash; otherwise executing the benchmark on large instances is infeasible. OLTP queries thus typically touch little data, in the order of log(N) tuples. In order not to measure fully cold query performance, OLTP benchmarks for that reason need a warmup phase with O(N/log(N)) queries in order to get the system into a representative state.</p> +<p>Now, what makes a benchmark <em>relevant</em>? In LDBC we think that benchmarks should be designed such that crucial areas of functionality are highlighted, and in turn system architects are stimulated to innovate. Either to catch up with competitors and bring the performance and functionality in line with the state-of-the-art but even to innovate and address technical challenges for which until now no good solutions exist, but which can give a decisive performance advantage in the benchmark. Inversely stated, benchmark design can thus be a powerful tool to influence the industry, as a benchmark design may set the agendas for multiple commercial design teams and database architects around the globe. To structure this design process, LDBC introduces the notion of <em>&ldquo;choke points&rdquo;</em>: by which we mean problems that challenge current technology. These choke points are collected and described early in the LDBC design process, and the workloads developed later are scored in terms of their coverage of relevant choke points. 
In the case of graph data querying, one of the choke points that is unique to the area is recursive Top-N query handling (e.g. shortest path queries). Another choke point that arises is the impact of correlations between attribute values of graph nodes (e.g. both employed by TUM) and the connectivity degree between nodes (the probability of being friends). The pattern observed in practice is that people who are direct colleagues are often in each other&rsquo;s friend networks. A query that selects people in a social graph that work for the same company, and then does a friendship traversal, may get bad intermediate result size estimates and therefore a suboptimal query plan, if optimizers remain unaware of value/structure correlations. So this is an area of functionality that the Social Network Benchmark (SNB) by LDBC will test.</p> +<p>To illustrate what choke points are in more depth, we wrote a <a href="https://ldbcouncil.org/docs/papers/tpc-h-analyzed-choke-points-tpctc2013.pdf">paper in the TPCTC 2013</a> conference that performs a post-mortem analysis of TPC-H and identifies 28 such choke points. <em><a href="chokepoints.png">This table</a></em> lists them all, grouped into six Choke Point (CP) areas (CP1 Aggregation, CP2 Join, CP3 Locality, CP4 Calculations, CP5 Subqueries and CP6 Parallelism). The classification also shows CP coverage over each of the 22 TPC-H queries (black is high impact, white is no impact).</p> +<p>I would recommend reading this paper to anyone who is interested in improving the TPC-H score of a relational database system, since this paper contains the collected experience of three database architects who have worked with TPC-H at length: Orri Erling (of Virtuoso), Thomas Neumann (Hyper, RDF-3X), and me (MonetDB, Vectorwise). Recently Orri Erling showed that this paper is not complete, as he discovered one more choke-point area for TPC-H: Top-N pushdown. In a detailed blog entry, Orri shows how this technique can <a href="http://www.openlinksw.com/weblog/oerling/?id=1779">trivialize Q18</a>, and this optimization can single-handedly improve the overall TPC-H score by 10-15%. This is also a lesson for LDBC: even though we design benchmarks with choke points in mind, the queries themselves may bring to light unforeseen opportunities and choke-points that may give rise to yet unknown innovations.</p> +<p>LDBC has just published two benchmarks as Public Drafts, which essentially means that you are cordially invited to download and try out the RDF-focused Semantic Publishing Benchmark <a href="https://ldbcouncil.org/developer/spb">(SPB)</a> and the more graph-focused Social Network Benchmark (<a href="https://ldbcouncil.org/developer/snb">SNB</a>), and <a href="https://groups.google.com/forum/#!forum/ldbcouncil">tell us what you think</a>.
Stay tuned for the coming detailed blog posts about these benchmarks, which will explain the graph and RDF processing choke-points that they test.</p> +<p><em>(for more posts from Peter Boncz, see also <a href="https://databasearchitects.blogspot.com">Database Architects</a>, a blog about data management challenges and techniques written by people who design and implement database systems)</em></p> + + + + + New Website Online LDBC Benchmarks Reach Public Draft + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/new-website-online-ldbc-benchmarks-reach-public-draft/ + <p>The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23 2014, in announcing that two of the benchmarks that it has been developing since 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In case of LDBC, the release is staged: now the benchmark software just runs read-only queries. This will be expanded in a few weeks with a mix of read- and insert-queries. Also, query validation will be added later. Watch this blog for the announcements to come, as this will be a matter of weeks to add.</p> +<p>The Public Draft stage means that the initial software (data generator, query driver) work and an initial technical specification and documentation has been written. In other words, there is a testable version of the benchmark available for anyone who is interested. Public Draft status does not mean that the benchmark has been adopted yet, it rather means that LDBC has come closer to adopting them, but is now soliciting feedback from the users. The benchmarks will remain in this stage at least until October 6. On that date, LDBC is organizing its fifth <a href="https://ldbcouncil.org/event/fifth-tuc-meeting">Technical User Community meeting</a>. One of the themes for that meeting is collecting user feedback on the Public Drafts; which input will be used to either further evolve the benchmarks, or adopt them.</p> +<p>You can also see that we created a this new website and a new logo. This website is different from <code>http://ldbc.eu</code> that describes the EU project which kick-starts LDBC. The ldbcouncil.org is a website maintained by the Linked Data Benchmark Council legal entity, which will live on after the EU project stops (in less than a year). The Linked Data Benchmark Council is an independent, impartial, member-sustained organization dedicated to the creation of RDF and graph data management benchmarks and benchmark practices.</p> +<p>In the next weeks, you will see many contributors in LDBC post items on this blog. Some of these blog entries will be very technical, others not, but all aim to explain what LDBC is doing for RDF and graph benchmarking, and why.</p> + + + + + Social Network Benchmark Goals + https://ldbcouncil.org/post/social-network-benchmark-goals/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/social-network-benchmark-goals/ + <p>Social Network interaction is amongst the most natural and widely spread activities in the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, Social Networks are well understood from the point of view of the data involved and the interaction required by their actors. 
Thus, the concepts of friends of friends or retweets are well established for the data attributes they represent, and queries such as “find the friend of a specified person who has long worked in a company in a specified country” are natural for the users and easy to understand from a functional point of view.</p> +<p>From a totally different perspective, Social Networks are challenging technologically, being part of the Big Data arena, and require the execution of queries that involve complex relationship search and data traversal computations that turn out to be choke points for the data management solutions in the market.</p> +<p>With the objective of shaping a benchmark that is up to date as a use case, well understood by everybody, and that poses significant technological challenges, the LDBC consortium decided to create the Social Network Benchmark, <a href="https://ldbcouncil.org/benchmarks/snb">SNB</a>, which is eventually going to include three workloads: the Interactive, the Business Intelligence and the Analytical. Those workloads are going to share a common synthetic data generation tool that will mimic the data managed by real Social Networks.</p> +<p>The SNB data generator created by LDBC is an evolution of the S3G2 data generator and can be found at the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">LDBC Github repository</a>. The data generator is unique because it generates data that contains realistic distributions and correlations among variables that were not taken into consideration before. It also allows generating large datasets because it uses a Hadoop-based implementation to compute the complex data generated. The SNB data generator has already been used in different situations like the <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD programming contest 2014</a>.</p> +<p>The SNB presents the Interactive workload as the first of the three, with the objective of resembling the queries that users may pose to a Social Network portal. These are a combination of small read and write queries that express the needs of a user who is interacting with her friends and connections through the Social Network. Queries like the one quoted above (Q12 in the workload) are examples that exercise choke points such as pattern recognition or full traversals.</p> +<p>More details will be given in the blogs to follow, both for the data generator and for the specific characteristics of the workloads, allowing users to get a first contact with the benchmarks.</p> + + + + + Welcome to the New Industry Oriented LDBC Organisation for Benchmarking RDF and Graph Technologies + https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/ + Tue, 14 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/welcome-to-the-new-industry-oriented-ldbc-organisation-for-benchmarking-rdf-and-graph-technologies/ + <p>It is with great pleasure that we announce the new LDBC organisation site at <a href="https://www.ldbcouncil.org">www.ldbcouncil.org</a>. The LDBC started as a European Community FP7 funded project with the objective to create, foster and become an industry reference for benchmarking RDF and Graph technologies.
A period of more than one and a half years has led us to the creation of the first two workloads, the Semantic Publishing Benchmark and the Social Network Benchmark in its interactive workload, which you will find in the <em>benchmarks</em> menu on this site.</p> +<p>Those benchmarks will allow all the actors in the RDF and Graph industry to know who is who and how the different technology players are reacting to the results of their competing industry companies. Thus, the users will have results to compare the technologies and vendors will have a clear idea of how their products evolve compared to other vendors, all with the objective to foster the technological growth of the RDF and Graph arena.</p> +<p>While the main objective of LDBC is to create benchmarks, we know that we need a strong community to grow and evolve those benchmarks taking into consideration all the market and technology needs. With this objective, we have created a special section to engage all the interested community through a blog, forums to discuss interesting issues and a lot of information on benchmarking, including links to other benchmarks, pointers to interesting conferences and venues and all the publications on benchmarking RDF and Graph technologies.</p> +<p>We want to make sure that we all know what benchmarking and the LDBC effort means, both historically, and from the global needs perspective. To make sure that this is accomplished, we set up a section open to the public with in depth explanations of the history of industry benchmarking, LDBC and why our society needs such efforts globally.</p> +<p>Finally, we want to invite you to our Fifth Technical Users Community (TUC) meeting to be held in Athens next Monday Oct. 6th 2014. This event will have as its main objective to allow for presentations on experiences with the two already released benchmarks, SNB and SPB. You’ll find updated information here.</p> +<p>In all, we expect that the LDBC organisation site engages all of you and that the growth of RDF and Graph technologies in the future is secured by the benchmarks fostered by us.</p> + + + + + 2nd International Workshop on Benchmarking RDF Systems + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/2nd-international-workshop-on-benchmarking-rdf-systems/ + <p>Following the 1st International workshop on Benchmarking RDF Systems (BeRSys 2013) the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industrials can meet to discuss topics related to the performance of RDF systems. BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines - in the line of TPCTC series of workshops.The focus of the workshop is to expose and initiate discussions on best practices, different application needs and scenarios related to different aspects of RDF data management.</p> +<p>More at: <a href="http://events.sti2.at/bersys2014/">http://events.sti2.at/bersys2014/</a></p> + + + + + DATAGEN: Data Generation for the Social Network Benchmark + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/ + <p>As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective to provide a realistic yet challenging workload, consisting of a social network and a set of queries. 
Both have to be realistic, easy to understand and easy to generate. The objective of this post is to discuss the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 <a href="#references">[1]</a>.</p> +<p>One of the most important components of a benchmark is the dataset. However, directly using real data in a benchmark is not always possible. On the one hand, it is difficult to find data with all the scaling characteristics the benchmark requires. On the other hand, collecting real data can be expensive or simply not possible due to privacy concerns.</p> +<p>For these reasons, LDBC-SNB provides DATAGEN, the synthetic data generator responsible for generating the datasets for the three LDBC-SNB workloads: the Interactive, the Business Intelligence and the Analytical. DATAGEN has been carefully designed with the following goals in mind:</p> +<ul> +<li><strong>Realism.</strong> The data generated by DATAGEN has to mimic the features found in a real social network. In DATAGEN, output attributes, cardinalities, correlations and distributions have been finely tuned to reproduce a real social network in each of its aspects. DATAGEN is aware of the data and link distributions found in a real social network such as Facebook <a href="#references">[2]</a>. Also, it uses real data from DBpedia, such as property dictionaries, which ensure that the content is realistic and correlated.</li> +<li><strong>Scalability.</strong> Since LDBC-SNB is targeting systems of different scales and budgets, DATAGEN must be capable of generating datasets of different sizes, from a few Gigabytes to Terabytes. DATAGEN is implemented following the MapReduce paradigm, allowing for the generation of large datasets on commodity clusters.</li> +<li><strong>Determinism.</strong> DATAGEN is deterministic regardless of the number of cores/machines used to produce the data. This important feature guarantees that all Test Sponsors will face the same dataset, thus making the comparisons between different systems fair and the benchmarks&rsquo; results reproducible.</li> +<li><strong>Usability.</strong> LDBC-SNB has been designed to have an affordable entry point. As such, DATAGEN has been strongly influenced by this philosophy, and therefore it has been designed to be as easy to use as possible.</li> +</ul> +<p>Finally, the area of action of DATAGEN is not limited to the scope of LDBC-SNB. Several researchers and practitioners are already using DATAGEN in a wide variety of situations. If you are interested in the internals and possibilities of DATAGEN, please visit its official repository (<a href="https://github.com/ldbc/ldbc_snb_datagen">https://github.com/ldbc/ldbc_snb_datagen</a>).</p> +<h4 id="references">References</h4> +<p>[1] Pham, Minh-Duc, Peter Boncz, and Orri Erling. &ldquo;S3g2: A scalable structure-correlated social graph generator.&rdquo; Selected Topics in Performance Evaluation and Benchmarking. Springer Berlin Heidelberg, 2013. 156-172.</p> +<p>[2] Prat-Pérez, Arnau, and David Dominguez-Sal. &ldquo;How community-like is the structure of synthetically generated graphs?.&rdquo; Proceedings of Workshop on GRAph Data management Experiences and Systems.
ACM, 2014.</p> + + + + + Getting Started With SNB + https://ldbcouncil.org/post/getting-started-with-snb/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/getting-started-with-snb/ + <p>In a previous blog post titled &ldquo;<a href="https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/">Is SNB like Facebook&rsquo;s LinkBench?</a>&rdquo;, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.</p> +<h3 id="datagen">DATAGEN</h3> +<p>DATAGEN is the data generator used by all the workloads of SNB. <a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark/">Here</a> we introduced the design goals that drive the development of DATAGEN, which can be summarized as: <em>Realism, Scalability, Determinism and Usability.</em></p> +<p>DATAGEN produces datasets with the following schema, in terms of entities and their relations. The generated data represents a snapshot of the activity of a social network similar to real social networks such as Facebook, during a period of time. Data includes entities such as Persons, Organizations, and Places. The schema also models the way persons interact, by means of the friendship relations established with other persons, and the sharing of content such as messages (both textual and images), replies to messages and likes to messages. People form groups to talk about specific topics, which are represented as tags.</p> +<p><img src="schema.png" alt="image"></p> +<p>For the sake of credibility, data produced by DATAGEN has to be realistic. In this sense, data produced by DATAGEN not only has a realistic schema, but also pays attention to the following items:</p> +<ul> +<li> +<p>Realistic distributions. The degree distribution of friendship relationships has been modeled to reproduce that found in the Facebook graph. Also, other distributions such as the number of replies to a post, the number of persons per country or the popularity of a tag have been realistically modeled either using known distributions or data extracted from real sources such as DBpedia.</p> +</li> +<li> +<p>Correlated attributes and relations. Attribute values are not chosen at random, but follow correlations. For instance, people from a specific country have a larger probability of having names typical of that country, of working at companies from that country, or of studying at universities of that country. Also, DATAGEN implements a relationship creation process that tries to reproduce the homophily principle, that is, people with similar characteristics tend to be connected.</p> +</li> +</ul> +<p>DATAGEN is built on top of Hadoop, to generate datasets of different sizes. It works either on single-node SMP machines or in a cluster environment. DATAGEN supports different output formats targeting different systems. On the one hand, we have the CSV format, where each entity and relation is output into a different comma-separated value file. On the other hand, it also supports the Turtle format for RDF systems.</p> +<p>Finally, DATAGEN outputs two other things:</p> +<ul> +<li> +<p>Update Streams, which will be used in the future to implement updates in the workloads.</p> +</li> +<li> +<p>Substitution parameters, which are the parameters of the query instances the LDBC driver will issue.
These are selected so that the query plans of the resulting query executions do not differ significantly.</p> +</li> +</ul> +<p>Configuring and using DATAGEN is easy. Please visit <a href="https://github.com/ldbc/ldbc_snb_datagen">this page</a> for more information.</p> +<h3 id="ldbc-driver">LDBC driver</h3> +<p>SNB is designed to be as easy to adopt as possible. Therefore, SNB provides the LDBC execution driver, which is designed to automatically generate the benchmark workload and gather the benchmark results. It generates a stream of operations in conformance with a workload definition, and executes those operations against some system using the provided database connector, and with the substitution parameters produced by DATAGEN. During execution, the driver continuously measures performance metrics, then upon completion it generates a report of those metrics.</p> +<p>It is capable of generating parallel workloads (e.g. concurrent reads and writes), while respecting the configured operation mix and ensuring that ordering between dependent operations is maintained. For further details on how the driver achieves that, please visit the Documentation <a href="https://github.com/ldbc/ldbc_driver/wiki">page</a>.</p> +<p>The test sponsor (i.e., the implementer of the benchmark) has to provide a set of implemented interfaces that form a benchmark implementation to plug into the driver, and then the benchmark is executed automatically.</p> +<p>Given a workload consisting of a series of <em>Operations</em>, the test sponsor implements <em>OperationHandlers</em> for them. <em>OperationHandlers</em> are responsible for executing instances of a specific operation (query) type. This is done by overriding the method <em>executeOperation</em>(), which receives an <em>Operation</em> instance as input parameter and returns the result. From the <em>Operation</em> instance, the operation&rsquo;s input parameters can be retrieved, as well as the database connection state.</p> +<p>The database connector is used to initialize, cleanup and get the database connection state. The database connector must implement the <em>Db</em> interface, which consists of three methods: <em>onInit</em>(), <em>onCleanup</em>() and <em>getConnectionState</em>(). <em>onInit</em>() is called before the benchmark is executed, and is responsible for initializing the database and registering the different <em>OperationHandlers</em>. <em>onCleanup</em>() is called after the benchmark has completed. Any resources that need to be released should be released here.</p> +<p>Finally, <em>getConnectionState</em>() returns an instance of <em>DbConnectionState</em>, which encapsulates any state that needs to be shared between <em>OperationHandler</em> instances. For instance, this state could contain the necessary classes used to execute a given query for the implementing system.</p> +<p>A good example on how to implement the benchmark can be found <a href="https://github.com/ldbc/ldbc_driver/wiki/Implementing%20a%20Database%20Connector">here</a>.</p>
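+<p>As a rough illustration of this structure, the sketch below condenses the pattern into plain Java. It deliberately defines its own simplified types, so all class and method names are illustrative only and do not reproduce the driver&rsquo;s exact interfaces and signatures; the linked documentation shows the real API.</p>
+<pre tabindex="0"><code>// Illustrative sketch of the connector/handler pattern described above;
+// NOT the actual LDBC driver interfaces or signatures.
+import java.util.HashMap;
+import java.util.Map;
+
+public class ConnectorSketch {
+
+    // State shared between handlers, e.g. a client/session for the system under test.
+    static class DbConnectionState {
+        final String endpoint;
+        DbConnectionState(String endpoint) { this.endpoint = endpoint; }
+    }
+
+    // One operation type of the workload, carrying its substitution parameters.
+    static class FriendsWithNameOperation {
+        final long personId;
+        final String firstName;
+        FriendsWithNameOperation(long personId, String firstName) {
+            this.personId = personId;
+            this.firstName = firstName;
+        }
+    }
+
+    // A handler knows how to execute one operation type against the system under test.
+    interface OperationHandler {
+        Object executeOperation(Object operation, DbConnectionState state);
+    }
+
+    // The connector: initialises resources, registers handlers, cleans up afterwards.
+    static class MyDb {
+        private final Map&lt;Class&lt;?&gt;, OperationHandler&gt; handlers = new HashMap&lt;&gt;();
+        private DbConnectionState state;
+
+        void onInit() {
+            state = new DbConnectionState("http://localhost:1234/db"); // made-up endpoint
+            handlers.put(FriendsWithNameOperation.class, (operation, s) -&gt; {
+                FriendsWithNameOperation op = (FriendsWithNameOperation) operation;
+                // a real handler would issue the corresponding query here
+                return "friends of " + op.personId + " named " + op.firstName;
+            });
+        }
+
+        void onCleanup() { /* release connections and other resources */ }
+
+        DbConnectionState getConnectionState() { return state; }
+
+        Object execute(Object operation) {
+            return handlers.get(operation.getClass())
+                           .executeOperation(operation, getConnectionState());
+        }
+    }
+
+    public static void main(String[] args) {
+        MyDb db = new MyDb();
+        db.onInit();
+        System.out.println(db.execute(new FriendsWithNameOperation(1234L, "Alice")));
+        db.onCleanup();
+    }
+}
+</code></pre>
+<p>The essential point of the design is that the driver owns scheduling and measurement, while the connector only supplies the per-operation execution logic and whatever connection state the handlers need to share.</p>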
+<h3 id="workloads">Workloads</h3>
+<p>Currently, LDBC has only released the first draft of the Interactive workload, but the business intelligence and analytical workloads are in the works. Workloads are designed to mimic the different usage scenarios found in operating a real social network site, and each of them targets one or more types of systems. Each workload defines a set of queries and query mixes, designed to stress the systems under test in different choke-point areas, while being credible and realistic.</p>
+<p>The Interactive workload reproduces the interaction between the users of the social network by including lookups and transactions that update small portions of the database. These queries are designed to be interactive and target systems capable of responding to such queries with low latency for multiple concurrent users. Examples of Interactive queries are, given a user, retrieving those friends with a specific name, or finding the most recent posts and comments created by your friends.</p>
+<p>The Business Intelligence workload will represent those business intelligence analytics a social network company would like to perform on the social network, in order to take advantage of the data to discover new business opportunities. This workload will explore moderate portions of data from different entities, and will perform more complex and data-intensive operations compared to the Interactive ones.</p>
+<p>Examples of possible Business Intelligence queries could be finding trending topics in a country at a given moment, or looking for fraudulent “likers”.</p>
+<p>Finally, the Analytical workload will aim at exploring the characteristics of the underlying structure of the network. Shortest paths, community detection or centrality are representative queries of this workload, and will imply touching a vast amount of the dataset.</p>
+<h3 id="final-remarks">Final remarks</h3>
+<p>This is just a quick overview of the SNB benchmark. For a more detailed description, do not hesitate to read the official SNB specification <a href="https://github.com/ldbc/ldbc_snb_docs">draft</a>, and stay tuned to the LDBC blog for future blog posts detailing all of the SNB parts in depth.</p>
+
+
+
+
+Introducing SNB Interactive, the LDBC Social Network Benchmark Online Workload
+https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/
+Thu, 09 Oct 2014 00:00:00 +0000
+
+https://ldbcouncil.org/post/introducing-snb-interactive-the-ldbc-social-network-benchmark-online-workload/
+<p>The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads: interactive, business intelligence and graph analytics. This post introduces the interactive workload.</p>
+<p>The benchmark measures the speed of queries of medium complexity against a social network being constantly updated. The queries are scoped to a user&rsquo;s social environment and potentially access data associated with the friends of a user and their friends.</p>
+<p>This is representative of an operational application. This goes beyond OLTP (On Line Transaction Processing) by having substantially more complex queries touching much more data than the point lookups and short reports in TPC-C or TPC-E. The emphasis is on presenting a rich and timely view of a constantly changing environment.</p>
+<p>SNB Interactive gives end users and application developers a reference workload for comparing the relative merits of different technologies for graph data management. These range from dedicated graph databases to RDF stores and relational databases. There are graph serving benchmarks such as Facebook&rsquo;s LinkBench, but SNB Interactive goes well beyond this in richness of schema and queries.</p>
+<p>The challenge to implementors is handling the user facing logic of a social network in a single system as the scale increases.
The present practice in large social networks is massive sharding and use of different SQL and key-value stores for different aspects of the service. The SNB workload is not intended to replicate this situation but to look for ways forward, so that one system can keep up with transactions and offer users rich and varied insight into their environment. The present practice relies on massive precomputation, but SNB Interactive seeks more agility and ad hoc capability also on the operational side.</p>
+<p>The dataset is scaled in buckets, with distinct scales for 10, 30, 100, 300GB and so forth. A 100GB dataset has approximately 500,000 simulated users with their connections and online history. This is a convenient low-end single-server size, while 500 million users is 100TB, which is a data center scale requiring significant scale-out.</p>
+<p>The metric is operations per minute at scale. Online benchmarks typically have a fixed ratio between throughput and dataset size. Here we depart from this, thus one can report arbitrarily high throughputs at any scale. This makes main memory approaches feasible, which corresponds to present online practices. The benchmark makes transactions and queries on a simulated timeline of social interactions. The challenge for the system is to run this as fast as possible at the selected scale while providing fast and predictable response times. Throughput can be increased at the cost of latency, but here the system must satisfy response time criteria while running at the reported throughput.</p>
+<p>Different technologies can be used for implementing SNB Interactive. The workload is defined in natural language with sample implementations in SPARQL and Cypher. Other possibilities include SQL and graph database APIs.</p>
+<p>SNB Interactive is an example of LDBC&rsquo;s choke point driven design methodology, where we draw on the combined knowledge and experience of several database system architects for defining realistic, yet ambitious challenges whose solution will advance the state of the art.</p>
+<p>The benchmark specification and associated tools are now offered for public feedback. The LDBC partners working on SNB Interactive will provide sample implementations of the workload on their systems, including Virtuoso, Neo4j and Sparsity. Specifics of availability and coverage may vary.</p>
+<p>Subsequent posts will address the workload in more detail.</p>
+
+
+
+
+Is SNB Like Facebooks LinkBench
+https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/
+Thu, 09 Oct 2014 00:00:00 +0000
+
+https://ldbcouncil.org/post/is-snb-like-facebooks-linkbench/
+<p>In this post, I will discuss in some detail the rationale and goals of the design of the <a href="https://ldbcouncil.org/benchmarks/snb">Social Network Benchmark</a> (SNB) and explain how it relates to real social network data as in Facebook, and in particular Facebook&rsquo;s own graph benchmark called <a href="https://www.facebook.com/notes/facebook-engineering/linkbench-a-database-benchmark-for-the-social-graph/10151391496443920">LinkBench</a>. We think SNB is the most intricate graph database benchmark to date (it&rsquo;s also available in RDF!), and it has already made some waves.
SNB recently received praise at the most important database systems conference <a href="http://www.sigmod2014.org/">SIGMOD in Snowbird</a> after being used for this year&rsquo;s <a href="https://arxiv.org/pdf/2010.12243.pdf">ACM SIGMOD Programming Contest</a>, which was about graph analytics.</p> +<p>SNB is intended to provide the following <strong>value</strong> to different stakeholders:</p> +<ul> +<li> +<p>For end users facing graph processing tasks, SNB provides a recognizable scenario against which it is possible to <em>compare merits of different products</em> and technologies. By covering a wide variety of scales and price points, SNB can serve as an aid to technology selection.</p> +</li> +<li> +<p>For vendors of graph database technology, SNB provides a <em>checklist of features</em> and performance characteristics that helps in product positioning and can serve to guide new development.</p> +</li> +<li> +<p>For researchers, both industrial and academic, the SNB dataset and workload provide <em>interesting challenges</em> in multiple technical areas, such as query optimization, (distributed) graph analysis, transactional throughput, and provides a way to objectively compare the effectiveness and efficiency of new and existing technology in these areas.</p> +</li> +</ul> +<p>I should clarify that even though the data model of SNB resembles Facebook (and we&rsquo;re extending it to also look more like Twitter), the goal of SNB is not to advise Facebook or Twitter what systems to use, they don&rsquo;t need LDBC for that. Rather, we take social network data as a model for the much more broader graph data management problems that IT practitioners face. The particular characteristic of a graph data management problem is that the queries and analysis is not just about finding data by value, but about learning about the <em>connection patterns</em> between data. The scenario of the SNB, a social network, was chosen with the following goals in mind:</p> +<ul> +<li> +<p>the benchmark scenario should be <strong>understandable</strong> to a large audience, and this audience should also understand the relevance of managing such data.</p> +</li> +<li> +<p>the scenario in the benchmark should cover the complete range of challenges <strong>relevant</strong> for graph data management, according to the benchmark scope.</p> +</li> +<li> +<p>the query challenges in it should be <strong>realistic</strong> in the sense that, though synthetic, similar data and workloads are encountered in practice.</p> +</li> +</ul> +<p>The SNB is in fact three distinct benchmarks with a common dataset, since there are <em>three different workloads</em>. Each workload produces a single metric for performance at the given scale and a price/performance metric at the scale. The full disclosure further breaks down the composition of the metric into its constituent parts, e.g. single query execution times.</p> +<ul> +<li> +<p><strong>Interactive Workload.</strong> The Interactive SNB workload is the first one we are releasing. It is defined in plain text, yet we have example implementations in Neo4j&rsquo;s Cypher, SPARQL and SQL. The interactive workloads tests a system&rsquo;s throughput with relatively simple queries with concurrent updates. The system under test (SUT) is expected to run in a steady state, providing durable storage with smooth response times. Inserts are typically small, affecting a few nodes at a time, e.g. uploading of a post and its tags. Transactions may require serializability, e.g. 
verifying that something does not exist before committing the transaction. Reads do not typically require more than read committed isolation. One could call the Interactive Workload an OLTP workload, but while queries typically touch a small fraction of the database, this can still be up to hundreds of thousands of values (the two-step neighborhood of a person in the social graph, often). Note that in order to support the read-queries, there is a lot of liberty to create indexing structures or materialized views, however such structures need to be maintained with regards to the continues inserts that also part of the workload. This workload is now in draft stage, which means that the <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a> and <a href="https://github.com/ldbc/ldbc_driver">driver software stack</a> are ready and the purpose is to obtain user feedback, as well as develop good system implementations. The first implementations of this workload are now running on Openlink Virtuoso, Neo4j and Sparsity Sparksee, and we are eager to see people try these, and optimize and involve these.</p> +</li> +<li> +<p><strong>Business Intelligence Workload.</strong> There is a first stab at this workload formulated in SPARQL, tested against Openlink Virtuoso. The BI workload consists of complex structured queries for analyzing online behavior of users for marketing purposes. The workload stresses query execution and optimization. Queries typically touch a large fraction of the data and do not require repeatable read. The queries will be concurrent with trickle load (not out yet). Unlike the interactive workload, the queries touch more data as the database grows.</p> +</li> +<li> +<p><strong>Graph Analytics Workload.</strong> This workload is not yet available. It will test the functionality and scalability of the SUT for graph analytics that typically cannot be expressed in a query language. As such it is the natural domain for graph programming frameworks like Giraph. The workload is still under development, but will consist of algorithms like PageRank, Clustering and Breadth First Search. The analytics is done on most of the data in the graph as a single operation. The analysis itself produces large intermediate results. The analysis is not expected to be transactional or to have isolation from possible concurrent updates.</p> +</li> +</ul> +<p>All the SNB scenarios share a common scalable synthetic data set, generated by a state-of-the art <a href="https://github.com/ldbc/ldbc_socialnet_bm/tree/master/ldbc_socialnet_dbgen">data generator</a>. We strongly believe in a single dataset that makes sense for all workloads, that is, the interactive and BI workloads will traverse data that has sensible PageRank outcomes, and graph clustering structure, etc. This is in contrast to <a href="http://people.cs.uchicago.edu/~tga/pubs/sigmod-linkbench-2013.pdf">LinkBench</a>, released by the team of Facebook that manages the OLTP workload on the Facebook Graph, which closely tunes to the <strong>low-level</strong> MySQL query patterns Facebook sees, but whose graph structure does not attempt to be realistic beyond average out degree of the nodes (so, it makes no attempts to create realistic community patterns or correlations) . 
The authors of LinkBench may be right that the graph structure does not make a difference for simple insert/update/delete/lookup actions which LinkBench itself tests, but for the SNB queries in the Interactive and BI workloads this is not true. Note that <a href="http://borthakur.com/ftp/sigmod2013.pdf">Facebook&rsquo;s IT infrastructure</a> does not store all user data in MySQL and its modified memcached (&quot;<a href="http://www.cs.cmu.edu/~pavlo/courses/fall2013/static/papers/11730-atc13-bronson.pdf">TAO</a>&quot;), some of it ends up in separate subsystems (using HDFS and HBase), which is outside of the scope of LinkBench. However, for queries like in the SNB Interactive and BI workloads it <strong>does</strong> matter how people are connected, and how the attribute values of connected people correlate. In fact, the SNB data generator is unique in that it generates a huge graph with <em>correlations</em>, where people who live together, have the same interests or work for the same company have greater chance to be connected, and people from Germany have mostly German names, etc. Correlations frequently occur in practice and can strongly influence the quality of query optimization and execution, therefore LDBC wants to test their effects on graph data management systems (the impact of correlation among values and structure on query optimization and execution are a &ldquo;choke point&rdquo; for graph data management system where LDBC wants to stimulate innovation).</p> + + + + + Making It Interactive + https://ldbcouncil.org/post/making-it-interactive/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/making-it-interactive/ + <p><em>Synopsis:</em> Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must be both credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation for what online systems in fact do. So, the workload mix must strike a balance between the practice and presenting new challenges.</p> +<p>It is about to be showtime for LDBC. The initial installment of the LDBC Social Network Benchmark (SNB) is the full data generator, test driver, workload and reference implementation for the interactive workload. SNB will further acquire business intelligence and graph analytics workloads but this post is about the interactive workload.</p> +<p>As part of finalizing the interactive workload, we need to determine precise mixes of the component queries and updates. We note that the interactive mix so far consists of very heavy queries. These touch, depending on the scale upwards of a million entities in the database.</p> +<p>Now, rendering a page view in a social network site does not touch millions of entities. The query that needs to be correct and up to date touches tens or hundreds of entities, e.g. posts or social connections for a single page impression. 
There are also statistical views like the count of people within so many steps or contact recommendations, but these are not real time and not recalculated each time they are shown.</p>
+<p>So, LDBC SNB has a twofold task:</p>
+<ol>
+<li>In order to be a credible interactive workload, it must in fact have characteristics of one.</li>
+<li>In order to stimulate progress it must have queries that are harder than those that go in routine page views but are still not database-wide analytics.</li>
+</ol>
+<p>Designing a workload presents specific challenges:</p>
+<ol>
+<li>The workload must be realistic enough for users to identify with it.</li>
+<li>The workload must pose challenges and drive innovation in a useful direction.</li>
+<li>The component operations must all play a noticeable role in it. If the operation&rsquo;s relative performance does not affect the score, why is it in the workload?</li>
+</ol>
+<p>The interactive mix now has 14 queries that are interesting from a query optimization and execution viewpoint but touch millions of entities. This is not what drives page impressions in online sites. Many uses of graph databases (GDB) and RDF are about online sites, so this aspect must not be ignored.</p>
+<p>Very roughly, the choke points (technical challenges) of SNB interactive are as follows:</p>
+<ul>
+<li>Random access - Traversing between people and content makes large numbers of random lookups. These can be variously parallelized and/or vectored.</li>
+<li>Query optimization must produce the right plans - The primary point is join order and join type. Index vs. hash based joins have very different performance properties and the right choice depends on correctly guessing the number of rows and of distinct keys on either side of the join.</li>
+<li>When doing updates and lookups, the execution plan is obvious but there the choke point is the scheduling of large numbers of short operations.</li>
+<li>Many queries have aggregation, many have distinct, all have result ordering and a limit on result count. The diverse interactions of these operators produce optimization opportunities.</li>
+</ul>
+<p>Dreaming up a scenario and workload is not enough for a benchmark. There must also be a strong indication that the job is doable and plausible in the scenario.</p>
+<p>In online benchmarks different operations have different frequencies and the operations are repeated large numbers of times. There is a notion of steady state, so that the reported result represents a level of performance a system can sustain indefinitely.</p>
+<p>A key part of the workload definition is the workload mix, i.e. the relative frequencies of the operations. This decides in fact what the benchmark measures.</p>
+<p>The other aspect is the metric, typically some variation on operations per unit of time.</p>
+<p>All these are interrelated. Here we can take clicks per second as a metric, which is easy to understand. We wish to avoid the pitfall of TPC-C, which ties the metric to a data size, so that for a high metric one must have a correspondingly larger database. This rule makes memory-only implementations in practice unworkable, while in reality many online systems in fact run from memory. So, here we scale in buckets, like in TPC-H, but we still have an online workload. The scenario of the benchmark has its own timeline, here called simulation time. A benchmark run produces events in the simulation time but takes place in real time. This defines an acceleration ratio. For example, we could say that a system does 1000 operations per second at 300G scale, with an acceleration of 7x, i.e. 7 hours worth of simulation time are done in one hour of real time. A metric of this form is directly understandable for sizing a system, as long as the workload mix is realistic. We note that online sites usually are provisioned so that servers do not run anywhere near their peak throughput at a busy time.</p>
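+<p>To make the relationship between simulation time, real time and the metric concrete, here is a small illustrative calculation in Java mirroring the example above; the figures are made up for illustration and are not part of the benchmark definition:</p>
+<pre><code class="language-java">// Toy calculation relating simulation time, wall-clock time and the metric.
+// All figures are illustrative; the benchmark rules define the real bookkeeping.
+public class AccelerationSketch {
+    public static void main(String[] args) {
+        double simulatedHours = 7.0;      // simulation time covered by the run
+        double wallClockHours = 1.0;      // real time the run took
+        long operations = 3_600_000L;     // operations completed in the run
+
+        double acceleration = simulatedHours / wallClockHours;          // 7x
+        double opsPerSecond = operations / (wallClockHours * 3600.0);   // 1000 ops/s
+        double opsPerMinute = opsPerSecond * 60.0;                      // 60000 ops/min
+
+        System.out.printf("acceleration %.1fx, %.0f ops/s, %.0f ops/min%n",
+                acceleration, opsPerSecond, opsPerMinute);
+    }
+}
+</code></pre>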
+<p>So how to define the actual mix? By measuring. But measuring requires a reference implementation that is generally up to date for the database science of the time and where the individual workload pieces are implemented in a reasonable manner, so no bad query plans or bad schema design. For the reference implementation, we use Virtuoso column store in SQL.</p>
+<p>But SQL is not graphy! Why not SPARQL? Because SPARQL has diverse fixed overheads and this is not an RDF-only workload. We do not want SPARQL overheads to bias the metric, we just want an implementation where we know exactly what goes on and how it works, with control of physical data placement so we know there are no obvious stupidities in any of this. SPARQL will come. Anyway, as said elsewhere, we believe that SPARQL will outgrow its overheads, at which point SQL or SPARQL is a matter of esthetic preference. For now, it is SQL and all we want is transparency into the metal.</p>
+<p>Having this, we peg the operation mix to the update stream generated by the data generator. At the 30G scale, there are 3.5M new posts/replies per month of simulation time. For each such event, a query mix will be run, so as to establish a realistic read/write ratio. The query mix will have fractional queries, for example 0.2 friends recommendations per new post, but that is not a problem, since we run large numbers of these and at the end of the run can check that the ratios of counts are as expected. Next, we run this as fast as it will go on the test system. Then we adjust the ratio of short and long queries to meet the following objectives:</p>
+<ul>
+<li>Short queries should collectively be about 45% of the CPU load.</li>
+<li>Updates will be under 5%.</li>
+<li>Long queries will take up the rest. For long queries, we further tune the relative frequencies so that each represents a roughly equal slice of the time. Having a query that does not influence the metric is useless, so each gets enough showtime to have an impact but by their nature some are longer than others.</li>
+</ul>
+<p>The reason why short queries should have a large slice is the fact that this is so in real interactive systems. The reason why long queries are important is driving innovation. Like this we get both scheduling (short lookup/update) and optimization choke points covered. As a bonus, we make the mix so that we get a high metric, so many clicks per second, since this is what the operator of an online site wants.</p>
+<p>There is a further catch: Different scales have different degrees of the friends graph and this will have a different influence on different queries. To see whether this twists the metric out of shape we must experiment. For example, one must not have logarithmic and linear complexity queries in the same mix, as BSBM for example has.
So this is to be kept in mind as we proceed.</p> +<p>In the next post we will look at the actual mix and execution times on the test system.</p> + + + + + SNB Data Generator - Getting Started + https://ldbcouncil.org/post/snb-data-generator-getting-started/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/snb-data-generator-getting-started/ + <p>In previous posts (<a href="https://ldbcouncil.org/post/datagen-data-generation-for-the-social-network-benchmark">this</a> and <a href="https://ldbcouncil.org/post/getting-started-with-snb">this</a>) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datatsets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.</p> +<h3 id="getting-and-configuring-hadoop">Getting and Configuring Hadoop</h3> +<p>DATAGEN runs on top of hadoop 1.2.1 to be scale. You can download it from here. Open a console and type the following commands to decompress hadoop into /home/user folder:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user +</span></span><span style="display:flex;"><span>$ tar xvfz hadoop-1.2.1.tar.gz +</span></span></code></pre></div><p>For simplicity, in this tutorial we will run DATAGEN in standalone mode, that is, only one machine will be used, using only one thread at a time to run the mappers and reducers. This is the default configuration, and therefore anything else needs to be done for configuring it. For other configurations, such as Pseudo-Distributed (multiple threads on a single node) or Distributed (a cluster machine), visit the <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/wiki/Configuration">LDBC DATAGEN wiki</a>.</p> +<h3 id="getting-and-configuring-datagen">Getting and configuring DATAGEN</h3> +<p>Before downloading DATAGEN, be sure to fulfill the following requirements:</p> +<ul> +<li>Linux based machine</li> +<li>java 1.6 or greater</li> +<li>python 2.7.X</li> +<li>maven 3</li> +</ul> +<p>After configuring hadoop, now is the time to get DATAGEN from the LDBC-SNB official repositories. Always download the latest release, which at this time is v0.1.2. Releases page is be found <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/releases">here</a>. Again, decompress the downloaded file with the following commands:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user +</span></span><span style="display:flex;"><span>$ tar xvfz ldbc_snb_datagen-0.1.2.tar.gz +</span></span></code></pre></div><p>This will create a folder called “ldbc_snb_datagen-0.1.2”.</p> +<p>DATAGEN provides a <em>run.sh</em> is a script to automate the compilation and execution of DATAGEN. 
It needs to be configured for your environment, so open it and set the two variables at the top of the script to the corresponding paths.</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>HADOOP_HOME<span style="color:#f92672">=</span>/home/user/hadoop-1.2.1 +</span></span><span style="display:flex;"><span>LDBC_SNB_DATAGEN_HOME<span style="color:#f92672">=</span>/home/user/ldbc_snb_datagen +</span></span></code></pre></div><p>HADOOP_HOME points to the path where hadoop-1.2.1 is installed, while LDBC_SNB_DATAGEN_HOME points to where DATAGEN is installed. Change these variables to the appropriate values. Now, we can execute <em>run.sh</em> script to compile and execute DATAGEN using default parameters. Type the following commands:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-bash" data-lang="bash"><span style="display:flex;"><span>$ cd /home/user/ldbc_snb_datagen-0.1.2 +</span></span><span style="display:flex;"><span>$ ./run.sh +</span></span></code></pre></div><p>This will run DATAGEN, and two folders will be created at the same directory: <em>social_network</em> containing the scale factor 1 dataset with csv uncompressed files, and <em>substitution_parameters</em> containing the substituion parameters needed by the driver to execute the benchmark.</p> +<h3 id="changing-the-generated-dataset">Changing the generated dataset</h3> +<p>The characteristics of the dataset to be generated are specified in the <em>params.ini</em> file. By default, this file has the following content:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:1</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:1</span> +</span></span></code></pre></div><p>The following is the list of options and their default values supported by DATAGEN:</p> +<table> +<thead> +<tr> +<th>Option</th> +<th>Default value</th> +<th>Description</th> +</tr> +</thead> +<tbody> +<tr> +<td>scaleFactor</td> +<td>1</td> +<td>&ldquo;The scale factor of the data to generate. Possible values are: 1, 3, 10, 30, 100, 300 and 1000&rdquo;</td> +</tr> +<tr> +<td>serializer</td> +<td>csv</td> +<td>&ldquo;The format of the output data. Options are: csv, csv_merge_foreign, ttl&rdquo;</td> +</tr> +<tr> +<td>compressed</td> +<td>FALSE</td> +<td>Specifies to compress the output data in gzip.</td> +</tr> +<tr> +<td>outputDir</td> +<td>./</td> +<td>Specifies the folder to output the data.</td> +</tr> +<tr> +<td>updateStreams</td> +<td>FALSE</td> +<td>&ldquo;Specifies to generate the update streams of the network. If set to false, then the update portion of the network is output as static&rdquo;</td> +</tr> +<tr> +<td>numThreads</td> +<td>1</td> +<td>Sets the number of threads to use. 
Only works for pseudo-distributed mode</td> +</tr> +</tbody> +</table> +<p>For instance, a possible <em>params.ini</em> file could be the following:</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">scaleFactor:30</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:ttl</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:true</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span> +</span></span></code></pre></div><p>For those not interested on generating a dataset for a given predefined scale factor, but for other applications, the following parameters can be specified (they need to be specified all together):</p> +<table> +<thead> +<tr> +<th>Option</th> +<th>Default value</th> +<th>Description</th> +</tr> +</thead> +<tbody> +<tr> +<td>numPersons</td> +<td>-</td> +<td>The number of persons to generate</td> +</tr> +<tr> +<td>numYears</td> +<td>-</td> +<td>The amount of years of activity</td> +</tr> +<tr> +<td>startYear</td> +<td>-</td> +<td>The start year of simulation.</td> +</tr> +</tbody> +</table> +<p>The following is an example of another possible <em>params.ini</em> file</p> +<div class="highlight"><pre tabindex="0" style="color:#f8f8f2;background-color:#272822;-moz-tab-size:4;-o-tab-size:4;tab-size:4;"><code class="language-ini" data-lang="ini"><span style="display:flex;"><span><span style="color:#a6e22e">numPersons:100000</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numYears:3</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">startYear:2010</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">serializer:csv_merge_foreign</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">compressed:false</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">updateStreams:true</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">outputDir:/home/user/output</span> +</span></span><span style="display:flex;"><span><span style="color:#a6e22e">numThreads:4</span> +</span></span></code></pre></div><p>For more information about the schema of the generated data, the different scale factors and serializers, please visit the wiki page of DATAGEN at <a href="https://github.com/ldbc/ldbc_snb_datagen_hadoop/">GitHub</a>!</p> + + + + + The Day of Graph Analytics + https://ldbcouncil.org/post/the-day-of-graph-analytics/ + Thu, 09 Oct 2014 00:00:00 +0000 + + https://ldbcouncil.org/post/the-day-of-graph-analytics/ + <p><em>Note: consider this post as a continuation of the &ldquo;<a href="https://ldbcouncil.org/post/making-it-interactive">Making it interactive</a>&rdquo; post by Orri Erling.</em></p> +<p>I have now completed the <a href="https://github.com/openlink/virtuoso-opensource">Virtuoso</a> TPC-H work, including scale out. Optimization possibilities extend to infinity but the present level is good enough. 
<a href="http://www.tpc.org/tpch/">TPC-H</a> is the classic of all analytics benchmarks and is difficult enough, I have extensive commentary on this on my blog (In Hoc Signo Vinces series), including experimental results. This is, as it were, the cornerstone of the true science. This is however not the totality of it. From the LDBC angle, we might liken this to the last camp before attempting a mountain peak.</p> +<p>So, we may now seriously turn to graph analytics. The project has enough left to run in order to get a good BI and graph analytics workload. In LDBC in general, as in the following, BI or business intelligence means complex analytical queries. Graph analytics means graph algorithms that are typically done in graph programming frameworks or libraries.</p> +<p>The BI part is like TPC-H, except for adding the following challenges:</p> +<ul> +<li> +<p>Joins of derived tables with group by, e.g. comparing popularity of items on consecutive time periods.</p> +</li> +<li> +<p>Transitive dimensions - A geographical or tag hierarchy can be seen as a dimension table. To get the star schema plan with the selective hash join, the count of the transitive traversal of the hierarchy (hash build side) must be correctly guessed.</p> +</li> +<li> +<p>Transitivity in fact table, i.e. average length of reply thread. There the cost model must figure that the reply link is much too high cardinality for hash build side, besides a transitive operation is not a good candidate for a build in multiple passes, hence the plan will have to be by index.</p> +</li> +<li> +<p>Graph traversal with condition on end point and navigation step. The hierarchical dimensions and reply threads are in fact trees, the social graph is not. Again the system must know some properties of connectedness (in/out degree, count of vertices) to guess a traversal fanout. This dictates the join type in the step (hash or index). An example is a transitive closure with steps satisfying a condition, e.g. all connected persons have a specific clearance.</p> +</li> +<li> +<p>Running one query with parameters from different buckets, implying different best plan.</p> +</li> +<li> +<p>Data correlations, e.g. high selectivity arising from two interests seldom occurring together, in places where the correct estimation makes the difference between a good and a bad plan.</p> +</li> +<li> +<p>Large intermediate results stored in tables, as in materializing complex summaries of data for use in follow up queries.</p> +</li> +<li> +<p>More unions and outer joins.</p> +</li> +</ul> +<p>The idea is to cover the base competences the world has come to expect and to build in challenges to last another 10-15 years.</p> +<p>For rules and metric, we can use the TPC-H or <a href="http://www.tpc.org/tpcds/default.asp">TPC-DS</a> ones as a template. The schema may differ from an implementation of the interactive workload, as these things would normally run on different systems anyway. As another activity that is not directly LDBC, I will do a merge of SNB and <a href="http://www.openstreetmap.org/">Open Street Map</a>. The geolocated things (persons, posts) will get real coordinates from their vicinity and diverse geo analytics will become possible. This is of some significant interest to Geoknow, another FP7 where OpenLink is participating.</p> +<p>Doing the BI mix and even optimizing the interactive part involves some redoing of the present support for transitivity in Virtuoso. 
The partitioned group by with some custom aggregates is the right tool for the job, with all parallelization, scale-out, etc ready. You see, TPC-H is very useful also in places one does not immediately associate with it.</p> +<p>As a matter of fact, this becomes a BSP (bulk synchronous processing) control structure. Run any number of steps, each item produces results/effects scattered across partitions. The output of the previous is the input of the next. We might say BSP is an attractor or &ldquo;Platonic&rdquo; control structure to which certain paths inevitably lead. Last year I did a BSP implementation in SQL, reading and writing tables and using transactions for serializable update of the border. This is possible but will not compete with a memory based framework and not enough of the optimization potential, e.g. message combining, is visible to the engine in this formulation. So, now we will get this right, as suggested.</p> +<p>So, the transitive derived table construct can have pluggable aggregations, e.g. remembering a path, a minimum length or such), reduction like a scalar-valued aggregate (min/max), different grouping sets like in a group by with cube or grouping sets, some group-by like reduction for message combining and so forth. If there is a gather phase that is not just the result of the scatter of the previous step, this can be expressed as an arbitrary database query, also cross partition in a scale-out setting.</p> +<p>The distributed/partitioned group by hash table will be a first class citizen, like a procedure scoped temporary table to facilitate returning multiple results and passing large data between multiple steps with different vertex operations, e.g. forward and backward in betweenness centrality.</p> +<p>This brings us to the graph analytics proper, which is often done in BSP style, e.g. <a href="http://es.slideshare.net/shatteredNirvana/pregel-a-system-for-largescale-graph-processing">Pregel</a>, <a href="http://giraph.apache.org">Giraph</a>, <a href="http://uzh.github.io/signal-collect/">Signal-Collect</a>, some but not all <a href="http://ppl.stanford.edu/main/green_marl.html">Green-Marl</a> applications. In fact, a Green-Marl back end for Virtuoso is conceivable, whether one will be made is a different matter.</p> +<p>With BSP in the database engine, a reference implementation of many standard algorithms is readily feasible and performant enough to do reasonable sizing for the workload and to have a metric. This could be edges or vertices per unit of time, across a mix of algorithms, for example. Some experimentation will be needed. The algorithms themselves may be had from the Green-Marl sample programs or other implementations. Among others, Oracle would presumably agree that this sort of functionality will in time migrate into core database. We will here have a go at this and along the way formulate some benchmark tasks for a graph analytics workload. Whenever feasible, this will derive from existing work such as <a href="http://graphbench.org/">graphbench.org</a> but will be adapted to the SNB dataset.</p> +<p>The analytics part will be done with more community outreach than the interactive one. I will blog about the business questions, queries and choke points as we go through them. 
The interested may pitch in as the matter comes up.</p>
+
+
+
+
+Using LDBC SPB to Find OWLIM Performance Issues
+https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/
+Wed, 20 Aug 2014 00:00:00 +0000
+
+https://ldbcouncil.org/post/using-ldbc-spb-to-find-owlim-performance-issues/
+<p>During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC <a href="https://ldbcouncil.org/developer/spb">Semantic Publishing Benchmark</a> (LDBC-SPB) as a part of our development and release process.</p>
+<p>The first thing we’ve started using the LDBC-SPB for is to monitor the performance of our RDF Store when a new release is about to come out.</p>
+<p>Initially we’ve decided to fix some of the benchmark parameters:</p>
+<ul>
+<li>the dataset size - 50 million triples (LDBC-SPB50)</li>
+<li>benchmark warmup and benchmark run times - 60s and 600s respectively</li>
+<li>maximum number of Editorial Agents (E): 2 (threads that will execute INSERT/UPDATE operations)</li>
+<li>maximum number of Aggregation Agents (A): 16 (threads that will execute SELECT operations)</li>
+<li>data generated by the benchmark driver to be “freshly” deployed before each benchmark run - the benchmark driver can be configured to generate the data and stop. We’re using that option and have a fresh copy of it put aside ready for each run.</li>
+</ul>
+<p>Having those parameters fixed, running LDBC-SPB is a straightforward task. The hardware we’re using for benchmarking is a machine with 2 Intel Xeon CPUs, 8 cores each, 256 GB of memory and SSD storage, running Linux. Another piece of hardware we’ve tested with is a regular desktop machine with an Intel i7, 32 GB of memory and HDD storage. During our experiments we have allowed a deviation in results of 5% to 10% because of the multi-threaded nature of the benchmark driver.</p>
+<p>We’ve also decided to produce some benchmark results on Amazon’s EC2 Instances and compare them with the results we’ve had so far. Starting with an m3.2xlarge instance (8 vCPUs, 30GB of memory and 2x80GB SSD storage) on a 50M dataset, we’ve achieved more than 50% lower results than the ones on our own hardware. On a larger Amazon instance, c3.4xlarge (16 vCPUs, 30GB of memory and doubled SSD storage), we’ve achieved the same performance in terms of aggregation operations and even worse performance in terms of editorial operations, which we attribute to the fact that Amazon instances are not providing consistent performance all the time.</p>
+<p>The following two charts show how OWLIM performs on different hardware and with different configurations. They also give an indication of Amazon’s capabilities compared to the results achieved on bare-metal hardware.</p>
+<p><img src="16-2-Performance.png" alt="image"></p>
+<p>Figure 1: OWLIM performance on 2 Amazon instances and 2 local machines, with 16 aggregation and 2 editorial agents running simultaneously. Aggregation and editorial operations displayed here should be considered independently, i.e. even though the editorial operations graph shows higher results on the Amazon m3.2xlarge instance, values are normalized and refer to the corresponding type of operation.</p>
+<p><img src="8-0-Performance.png" alt="image"></p>
+<p>Figure 2: OWLIM performance on 2 Amazon instances and 2 local machines, with 8 aggregation agents running simultaneously. Read-only mode.</p>
+<p>Another thing that we’re using LDBC-SPB for is to monitor data loading performance.
Loading of generated data can be done either manually by creating some sort of a script (CURL), or by the benchmark driver itself which will execute a standard POST request against a provided SPARQL endpoint. Benchmark&rsquo;s data generator can be configured to produce chunks of generated data in various sizes, which can be used for exeperiments on load performance. Of course load times of forward-chaining reasoners can not be compared to backward-chaining ones which is not the goal of the benchmark. Loading performances is not measured “officially“ by LDBC-SPB (although time for loading the data is reported), but its good thing to have when comparing RDF Stores.</p> +<p>An additional and interesting feature of the SPB is the test for conformance to OWL2-RL rule-set. It is a part of the LDBC-SPB benchmark and that phase is called <em>checkConformance</em>. The phase is run independently of the benchmark phase itself. It requires no data generation or loading except the initial set of ontologies. It tests RDF store’s capabilities for conformance to the rules in OWL2-RL rule-set by executing a number of INSERT/ASK queries specific for each rule. The result of that phase is a list of all rules that have been passed or failed which is very useful for regression testing.</p> + + + + + Fourth TUC meeting + https://ldbcouncil.org/event/fourth-tuc-meeting/ + Thu, 03 Apr 2014 12:32:22 -0400 + + https://ldbcouncil.org/event/fourth-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the fourth Technical User Community (TUC) meeting.</p> +<p>This will be a one-day event at CWI in Amsterdam on <em>Thursday April 3, 2014</em>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend. 
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<p><strong>For presenters please limit your talks to just 15 minutes</strong></p> +<h3 id="agenda">Agenda</h3> +<p><strong>April 3rd</strong></p> +<ul> +<li> +<p>10:00 Peter Boncz (VUA) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506371.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=JYWVgrP1kVY">video</a>: <em>LDBC project status update</em></p> +</li> +<li> +<p>10:20 Norbert Martinez (UPC) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506375.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=4yREJQ3yDr0">video</a>: <em>Status update on the LDBC Social Network Benchmark (SNB) task force</em>.</p> +</li> +<li> +<p>10:50 Alexandru Iosup (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506363.ppt">ppt</a>, <a href="https://www.youtube.com/watch?v=ulT-RFwKpOE">video</a>: <em>Towards Benchmarking Graph-Processing Platforms</em></p> +</li> +<li> +<p>11:10 Mike Bryant (Kings College) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506364.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=KiHRTu9xx0A">video</a>: <em>EHRI Project: Archival Integration with Neo4j</em></p> +</li> +</ul> +<p><strong>11:30 coffee</strong></p> +<ul> +<li> +<p>11:50 Thilo Muth (University of Magdeburg) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506369.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=5xH3UDLP6Oc">video</a>: <em>MetaProteomeAnalyzer: a graph database backed software for functional and taxonomic protein data analysis</em></p> +</li> +<li> +<p>12:10 Davy Suvee (Janssen Pharmaceutica / Johnson &amp; Johnson) – <a href="https://www.youtube.com/watch?v=XN3LRJUfJIU">video</a>: <em>Euretos Brain - Experiences on using a graph database to analyse data stored as a scientific knowledge graph</em></p> +</li> +<li> +<p>12:30 Yongming Luo (TU Eindhoven) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506366.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=g_my3tBB2_s">video</a>: <em>Regularities and dynamics in bisimulation reductions of big graphs</em></p> +</li> +<li> +<p>12:50 Christopher Davis (TU Delft) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506370.pdf">pdf</a>, <a href="https://www.youtube.com/channel/UC6HbzfJ4016Vez-2HKNeDag">video</a>: <em>Enipedia - Enipedia is an active exploration into the applications of wikis and the semantic web for energy and industry issues</em></p> +</li> +</ul> +<p><strong>13:10 - 14:30 lunch @ restaurant Polder</strong></p> +<ul> +<li> +<p>14:30 <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506365.pptx">SPB task force report</a></p> +</li> +<li> +<p>15:00 Bastiaan Bijl (Sysunite) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506373.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=TsCeKDHShMY">video</a>: <em>Using a semantic approach for monitoring applications in large engineering projects</em></p> +</li> +<li> +<p>15:20 Frans Knibbe (Geodan) – <a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506372.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=uAX-m4OewPM">video</a>: <em>Benchmarks for geographical data</em></p> +</li> +<li> +<p>15:40 Armando Stellato (University of Rome, Tor Vergata &amp; UN Food and Agriculture Organization) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506374.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=mfA4csAs72Y">video</a>: <em>VocBench2.0, a Collaborative Environment for SKOS/SKOS-XL Management: scalability and (inter)operatibility challenges</em></p> +</li> +</ul> +<p><strong>16:00 coffee</strong></p> +<ul> +<li> +<p>16:20 Ralph Hodgson (TopQuadrant) – [pdf](https://pu b-3834 10a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachment s/5538064/5506367.pdf), <a href="https://www.youtube.com/watch?v=ZUDnVw9P_Rc">video</a>:<em>Customer experiences in implementing SKOS-based vocabularymanagement systems</em></p> +</li> +<li> +<p>16:40 Simon Jupp (European Bioinformatics Institute) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506368.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=CgTuOGK92W8">video</a>: <em>[Delivering RDF for the life science at the European Bioinformatics Institute: Six months in.]</em></p> +</li> +<li> +<p>17:00 Jerven Bolleman (Swiss Institute of Bioinformatics) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506381.pdf">pdf</a>, <a href="https://www.youtube.com/watch?v=QTc3yOgoEsg">video</a>: <em>Breakmarking UniProt RDF. SPARQL queries that make your database cry&hellip;</em></p> +</li> +<li> +<p>17:20 Rein van &rsquo;t Veer (Digital Heritage Netherlands) – <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506380.pptx">pptx</a>, <a href="https://www.youtube.com/watch?v=2vDrZoskGyQ">video</a> <em>Time and space for heritage</em></p> +</li> +<li> +<p>17:40 <strong>end of meeting</strong></p> +</li> +<li> +<p>19:00 - 21:30 Social Dinner in restaurant Boom</p> +</li> +</ul> +<p><strong>April 4th</strong></p> +<p>LDBC plenary meeting for project partners.</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5506362.ppt">Benchmarking Graph-Processing Platforms: A Vision</a> – Alexandru Iosup</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p>The meeting will be held at the Dutch national research institute for computer science and mathematics (<a href="http://www.cwi.nl">CWI</a> - Centrum voor Wiskunde en Informatica). 
It is located at <a href="http://www.amsterdamsciencepark.nl/">Amsterdam Science Park</a>:</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505821.jpg" alt=""></p> +<p>(<a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/fourth-tuc-meeting/attachments/5538064/5505820.pdf">A5 map</a>)</p> +<h6 id="travel">Travel</h6> +<p><strong>Arriving &amp; departing:</strong></p> +<p>Amsterdam has a well-functioning and nearby airport called Schiphol (AMS, <a href="http://www.schiphol.com/">www.schiphol.nl</a>) that serves all main European carriers and also very many low-fare carriers.</p> +<p><a href="http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane">http://www.iamsterdam.com/en/visiting/touristinformation/gettingaround/arrival-and-departure/arrival-by-plane</a></p> +<p><strong>Trains</strong> (~5 per hour) are the most convenient means of transport between Schiphol airport and Amsterdam city center, the Centraal Station (17 minutes, a train every 15 minutes) &ndash; which station you are also likely arriving at in case of an international train trip.</p> +<p>From the Centraal Station in Amsterdam, there is a direct train (every half an hour, runs 11 minutes) to the Science Park station, which is walking distance of CWI. If you go from the Centraal Station to one of the hotels, you should take tram 9 &ndash; it starts at Centraal Station (exception: for Hotel Casa 400, you should take the metro to Amstel station - any of the metros will do).</p> +<p><strong>Taxi</strong> is an alternative, though expensive. The price from Schiphol will be around 45 EUR to the CWI or another point in the city center (depending on traffic, the ride is 20-30 minutes).</p> +<p><strong>Public transportation</strong> (tram, bus, metro) tickets for a single ride and 1-day (24 hour) passes can be purchased from the driver/conductor on trams and buses (cash only) and from vending machines in the metro stations.</p> +<p><strong>Only the &ldquo;disposable&rdquo; cards are interesting for you as visitor.</strong></p> +<p>Multi-day (up to 7-days/168 hours) passes can only be purchased from the vending machines or from the ticket office opposite of Centraal Station.</p> +<p><strong>Getting Around:</strong> the fastest way to move in the city of Amsterdam generally is by bicycle. Consider renting such a device at your hotel. For getting from your hotel to the CWI, you can either take a taxi (expensive), have a long walk (35min), use public transportation (for NH Tropen/The Manor take bus 40 from Muiderpoort Station, for Hotel Casa 400 same bus 40 but from Amstel station, and for the Rembrandt Hotel it is tram 9 until Middenweg/Kruislaan and then bus 40), or indeed bike for 12 minutes.</p> +<p><strong>Cars</strong></p> +<p>In case you plan to arrive by car, please be aware that parking space in Amsterdam is scarce and hence very expensive. But, you can park your car on the &ldquo;WCW&rdquo; terrain where CWI is located. To enter the terrain by car, you have to get a ticket from the machine at the gate. To leave the terrain, again, you can get an exit ticket from the CWI reception.</p> +<p><strong>Arriving at CWI:</strong> Once you arrive at CWI, you need to meet the reception, and tell them that you are attending the LDBC TUC meeting. 
Then, you&rsquo;ll receive a visitor&rsquo;s pass that allows you to enter our building.</p> +<p><strong>Social Dinner</strong></p> +<p>The social dinner will take place at 7pm on April 3 in Restaurant Boom (<a href="http://www.boometenendrinken.nl/">boometenendrinken.nl</a>), Linneausstraat 63, Amsterdam.</p> + + + + + Third TUC Meeting + https://ldbcouncil.org/event/third-tuc-meeting/ + Tue, 19 Nov 2013 08:00:00 +0000 + + https://ldbcouncil.org/event/third-tuc-meeting/ + <p>The LDBC consortium is pleased to announce the third Technical User Community (TUC) meeting!</p> +<p>This will be a one day event in London on the <strong>19 November 2013</strong> running in collaboration with the <a href="http://www.graphconnect.com/london/">GraphConnect</a> event (18/19 November). Registered TUC participants that would like a free pass to all of GraphConnect should register for GraphConnect using this following coupon code: <strong>LDBCTUC</strong>.</p> +<p>The TUC event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology</li> +<li>Industry discussions on the contents of the benchmarks</li> +</ul> +<p>We will also be launching the LDBC non-profit organization, so anyone outside the EU project will be able to join as a member.</p> +<p>We will kick off new benchmark development task forces in the coming year, and talks at this coming TUC will play an important role in deciding the use case scenarios that will drive those benchmarks.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a></li> +<li><a href="#ldbctuc-background">LDBC/TUC Background</a> +<ul> +<li><a href="#social-network-benchmark">Social Network Benchmark</a></li> +<li><a href="#semantic-publishing-benchmark">Semantic Publishing Benchmark</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>November 19th - Public TUC Meeting</strong></p> +<p>8:00 Breakfast and registration will open for Graph Connect/TUC at 8:00 am (Dexter House)</p> +<p>short LDBC presentation (Peter Boncz) during GraphConnect keynote by Emil Eifrem (09:00-09:30 Dexter House)</p> +<p>NOTE: the TUC meeting is at the Tower Hotel, nearby Dexter House.</p> +<p>10:00 TUC Meeting Opening (Peter Boncz)</p> +<p>10:10 TUC Presentations (RDF Application Descriptions)</p> +<ul> +<li>Johan Hjerling (BBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275669.pdf">BBC Linked Data and the Semantic Publishing Benchmark</a></strong></em></li> +<li>Andreas Both (Unister): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505027.pdf">Ontology-driven applications in an e-commerce context</a></strong></em></li> +<li>Nuno Carvalho (Fujitsu Laboratories Europe): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275666.pdf"><em><strong>Fujitsu RDF use cases and benchmarking requirements</strong></em></a></li> +<li>Robina Clayphan (Europeana): <em><strong><a 
href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816977.ppt">Europeana and Open Data</a></strong></em></li> +</ul> +<p>11:30 Semantic Publishing Benchmark (SPB)</p> +<ul> +<li>Venelin Kotsev (Ontotext - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">Semantic Publishing Benchmark Task Force Update</a></strong></em> and <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">report</a></strong></em></li> +</ul> +<p>12:00-13:00 Lunch at the Graph Connect venue</p> +<p><em>Talks During Lunch:</em></p> +<ul> +<li>Pedro Furtado, Jorge Bernardino (Univ. Coimbra): <strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275671.pdf">KEYSTONE Cost Action</a></strong></li> +</ul> +<p>13:00 TUC Presentations (Graph Application Descriptions)</p> +<ul> +<li>Minqi Zhou / Weining Qian (East China Normal University): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275670.pdf">Elastic and realistic social media data generation</a></strong></em></li> +<li>Andrew Sherlock (Shapespace): <em><strong>Shapespace Use Case</strong></em></li> +<li>Sebastian Verheughe (Telenor): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275667.pdf">Real-time Resource Authorization</a></strong></em></li> +</ul> +<p>14:00 Social Network Benchmark (SNB)</p> +<ul> +<li>Norbert Martinez (UPC - LDBC): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505025.pdf">Social Network Benchmark Task Force Update</a></strong></em> and <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816975.pdf">Report</a></li> +</ul> +<p><em>14:30 Break</em></p> +<p>14:45 TUC Presentations (Graph Analytics)</p> +<ul> +<li>Keith Houck (IBM): <em><strong>Benchmarking experiences with [System G Native Store (tentative title)]</strong></em></li> +<li>Abraham Bernstein (University of Zurich): <em><strong>Streams and Advanced Processing: Benchmarking RDF querying beyond the Standard SPARQL Triple Store</strong></em></li> +<li>Luis Ceze (University of Washington): <em><strong>Grappa and GraphBench Status Update</strong></em></li> +</ul> +<p><em>15:45 Break</em></p> +<p>16:00 TUC Presentations* (Possible Future RDF Benchmarking Topics)*</p> +<ul> +<li>Christian-Emil Ore (Unit for Digital Documentation, University of Oslo, Norway): <em><strong>CIDOC-CRM</strong></em></li> +<li>Atanas Kiryakov (Ontotext): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275672.pdf">Large-scale Reasoning with a Complex Cultural Heritage Ontology (CIDOC CRM)</a></strong></em></li> +<li>Kostis Kyzirakos (National and Kapodistrian University of Athens / CWI): <em><strong><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5275668.pdf">Geographica: A Benchmark for Geospatial RDF Stores</a></strong></em></li> +<li>Xavier Lopez (Oracle): <em><strong>W3C Property Graph progress</strong></em></li> +<li>Thomas Scharrenbach (University Zurich) <em><strong>PCKS: Benchmarking Semantic Flow Processing Systems</strong></em></li> +</ul> +<p>17:20 
Meeting Conclusion (Josep Larriba Pey)</p> +<p>17:30 End of TUC meeting</p> +<p>19:00 Social dinner</p> +<p><strong>November 20th - Internal LDBC Meeting</strong></p> +<p>10:00 Start</p> +<p>12:30 <em>End of meeting</em></p> +<ul> +<li>coffee and lunch provided</li> +</ul> +<h3 id="logistics">Logistics</h3> +<p><strong>Date</strong></p> +<p>19th November 2013</p> +<p><strong>Location</strong></p> +<p>The TUC meeting will be held in <strong>The Tower</strong> hotel (<a href="http://goo.gl/qZt8Fz">Google Maps link</a>) approximately 4 minutes walk from the <a href="http://www.graphconnect.com/london/">GraphConnect</a> conference in London.</p> +<p>Getting there</p> +<ul> +<li>From City Airport is the easiest: short ride on the DLR to Tower Gateway. Easy.</li> +<li>From London Heathrow: first need to take the Heathrow Express to Paddington. Then take the Circle line to Tower Hill. <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554995.pdf">See attached</a>.</li> +</ul> +<h3 id="ldbctuc-background">LDBC/TUC Background</h3> +<p>Looking back, we have been working on two benchmarks for the past year: a Social Network Benchmark (SNB) and a Semantic Publishing Benchmark (SPB). While below we provide a short summary, all the details of the work on these benchmark development efforts can be found in the first yearly progress reports:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SNB_Report_Nov2013.pdf</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4816974.pdf">LDBC_SPB_Report_Nov2013.pdf</a></li> +</ul> +<p>A summary of these efforts can be read below or, for a more detailed account, please refer to: <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/4554967.pdf">The Linked Data Benchmark Council: a Graph and RDF industry benchmarking effort</a>. Annual reports about the progress, results, and future work of these two efforts will soon be available for download here, and will be discussed in depth at the TUC.</p> +<h4 id="social-network-benchmark">Social Network Benchmark</h4> +<p>The Social Network Benchmark (SNB) is designed for evaluating a broad range of technologies for tackling graph data management workloads. The systems targeted are quite broad: from graph, RDF, and relational database systems to Pregel-like graph compute frameworks. The social network scenario was chosen with the following goals in mind:</p> +<ul> +<li>it should be understandable, and the relevance of managing such data should be understandable</li> +<li>it should cover the complete range of interesting challenges, according to the benchmark scope</li> +<li>the queries should be realistic, i.e., similar data and workloads are encountered in practice</li> +</ul> +<p>SNB includes a data generator for creation of synthetic social network data with the following characteristics:</p> +<ul> +<li>data schema is representative of real social networks</li> +<li>data generated includes properties occurring in real data, e.g. 
irregular structure, structure/value correlations, power-law distributions</li> +<li>the software generator is easy to use, configurable and scalable</li> +</ul> +<p>SNB is intended to cover a broad range of aspects of social network data management, and therefore includes three distinct workloads:</p> +<ul> +<li><strong>Interactive</strong> +<ul> +<li>Tests system throughput with relatively simple queries and concurrent updates; it is designed to test ACID features and scalability in an online operational setting.</li> +<li>The targeted systems are expected to be those that offer transactional functionality.</li> +</ul> +</li> +<li><strong>Business Intelligence</strong> +<ul> +<li>Consists of complex structured queries for analyzing the online behavior of users for marketing purposes; it is designed to stress query execution and optimization.</li> +<li>The targeted systems are expected to be those that offer an abstract query language.</li> +</ul> +</li> +<li><strong>Graph Analytics</strong> +<ul> +<li>Tests the functionality and scalability of systems for graph analytics, which typically cannot be expressed in a query language.</li> +<li>Analytics is performed on most/all of the data in the graph as a single operation and produces large intermediate results, and it is not expected to be transactional or need isolation.</li> +<li>The targeted systems are graph compute frameworks, though database systems may compete, for example by using iterative implementations that repeatedly execute queries and keep intermediate results in temporary data structures.</li> +</ul> +</li> +</ul> +<h4 id="semantic-publishing-benchmark">Semantic Publishing Benchmark</h4> +<p>The Semantic Publishing Benchmark (SPB) simulates the management and consumption of RDF metadata that describes media assets, or creative works.</p> +<p>The scenario is a media organization that maintains RDF descriptions of its catalogue of creative works &ndash; input was provided by actual media organizations which make heavy use of RDF, including the BBC. The benchmark is designed to reflect a scenario where a large number of aggregation agents provide the heavy query workload, while at the same time a steady stream of creative work description management operations is in progress. This benchmark only targets RDF databases that support at least basic forms of semantic inference. A tagging ontology is used to connect individual creative work descriptions to instances from reference datasets, e.g. sports, geographical, or political information. The data used falls under the following categories: reference data, which is a combination of several Linked Open Data datasets, e.g. GeoNames and DBpedia; domain ontologies, which are specialist ontologies used to describe certain areas of expertise of the publisher, e.g., sport and education; publication asset ontologies, which describe the structure and form of the assets that are published, e.g., news stories, photos, video, audio, etc.; and tagging ontologies and the metadata that link assets with reference/domain ontologies.</p> +<p>The data generator is initialized by using several ontologies and datasets. The instance data collected from these datasets are then used at several points during the execution of the benchmark. 
Data generation is performed by generating SPARQL fragments for create operations on creative works and executing them against the RDF database system.</p> +<p>Two separate workloads are modeled in SPB:</p> +<ul> +<li><strong>Editorial:</strong> Simulates creating, updating and deleting creative work metadata descriptions. Media companies use both manual and semi-automated processes for efficiently and correctly managing asset descriptions, as well as annotating them with relevant instances from reference ontologies.</li> +<li><strong>Aggregation:</strong> Simulates the dynamic aggregation of content for consumption by the distribution pipelines (e.g. a web-site). The publishing activity is described as &ldquo;dynamic&rdquo;, because the content is not manually selected and arranged on, say, a web page. Instead, templates for pages are defined and the content is selected when a consumer accesses the page.</li> +</ul> +<p><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/third-tuc-meeting/attachments/4325436/5505026.pdf">Status of the Semantic Publishing Benchmark</a></p> + + + + + Second TUC Meeting + https://ldbcouncil.org/event/second-tuc-meeting/ + Mon, 22 Apr 2013 10:00:00 +0000 + + https://ldbcouncil.org/event/second-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the second Technical User Community (TUC) meeting.</p> +<p>This will be a two day event in Munich on the <strong>22/23rd April 2013</strong>.</p> +<p>The event will include:</p> +<ul> +<li>Introduction to the objectives and progress of the LDBC project.</li> +<li>Description of the progress of the benchmarks being evolved through Task Forces.</li> +<li>Users explaining their use-cases and describing the limitations they have found in current technology.</li> +<li>Industry discussions on the contents of the benchmarks.</li> +</ul> +<p>All users of RDF and graph databases are welcome to attend. 
If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +<li><a href="#venue">Venue</a> +<ul> +<li><a href="#getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</a></li> +<li><a href="#getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</a></li> +<li><a href="#getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</a></li> +</ul> +</li> +<li><a href="#getting-there">Getting there</a></li> +<li><a href="#social-dinner">Social Dinner</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p><strong>April 22nd</strong></p> +<p>10:00 <em>Registration.</em><br> +10:30 Josep Lluis Larriba Pey (UPC) - <em>Welcome and Introduction.</em><br> +10:30 Peter Boncz (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687373.pptx">LDBC: goals and status</a></p> +<p><em>Social Network Use Cases (with discussion moderated by Josep Lluis Larriba Pey)</em></p> +<p>11:00 Josep Lluis Larriba Pey (UPC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687372.pdf">Social Network Benchmark Task Force</a><br> +11:30 Gustavo González (Mediapro): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687367.pdf">Graph-based User Modeling through Real-time Social Streams</a><br> +12:00 Klaus Großmann (Dshini): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687365.pdf">Neo4j at Dshini</a></p> +<p>12:30 Lunch</p> +<p><em>Semantic Publishing Use Cases (with discussion moderated by Barry Bishop)</em></p> +<p>13:30 Barry Bishop (Ontotext): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687366.pptx">Semantic Publishing Benchmark Task Force</a><br> +14:00 Dave Rogers (BBC): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687364.pptx">Linked Data Platform at the BBC</a><br> +14:30 Edward Thomas (Wolters Kluwer): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687374.pdf">Semantic Publishing at Wolters Kluwer</a></p> +<p>15:00 Coffee break</p> +<p><em>Projects Related to LDBC</em></p> +<p>15:30 Fabian Suchanek (MPI): &ldquo;YAGO: A large knowledge base from Wikipedia and WordNet&rdquo;<br> +16:00 Antonis Loziou (VUA): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687375.pptx">The OpenPHACTS approach to data integration</a><br> +16:30 Mirko Kämpf (Brox): &ldquo;GeoKnow - Spatial Data Web project and Supply Chain Use Case&rdquo;</p> +<p>17:00 <em>End of first day</em></p> +<p>19:00 Social dinner</p> +<p><strong>April 23rd</strong></p> +<p><em>Industry &amp; Hardware Aspects</em></p> +<p>10:00 Xavier Lopez (Oracle): <a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687384.pdf">Graph Database Performance an Oracle Perspective.pdf</a><br> +10:30 Pedro Trancoso (University of Cyprus): &ldquo;Benchmarking and computer architecture: the research 
side&rdquo;</p> +<p>11:00 Coffee break</p> +<p><em>Future Steps and TUC feedback session</em></p> +<p>11:30 Peter Boncz (VUA) moderates: next steps in the Social Networking Task Force<br> +12:00 Barry Bishop (Ontotext) moderates: next steps in the Semantic Publishing Task Force</p> +<p>12:30 <em>End of meeting</em></p> +<h3 id="logistics">Logistics</h3> +<h4 id="date">Date</h4> +<p>22nd and 23rd April 2013</p> +<h4 id="location">Location</h4> +<p>The TUC meeting will be held in room LE009 at LRZ (Leibniz-Rechenzentrum), located inside the TU Munich campus in Garching, Germany. The address is:</p> +<p>LRZ (Leibniz-Rechenzentrum)<br> +Boltzmannstraße 1<br> +85748 Garching, Germany</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including taxi and subway (<a href="http://www.in.tum.de/fileadmin/user_upload/Sonstiges/anfahrt_garching.pdf">U-Bahn</a>).</p> +<h5 id="getting-to-the-tum-campus-from-the-munich-city-center-subway-u-bahn">Getting to the TUM Campus from the Munich city center: Subway (U-Bahn)</h5> +<p>Take the U-Bahn line U6 in the direction of Garching-Forschungszentrum and exit at the end station. Take the south exit to the MI-Building and LRZ on the Garching Campus. The journey from the city center takes approx. 25-30 minutes. To get here from the city center, you need the Munich XXL ticket, which costs around 7.50 euros and covers all types of transportation for one day. The ticket has to be validated before the ride.</p> +<h5 id="getting-to-the-tum-campus-from-the-munich-airport">Getting to the TUM Campus from the Munich Airport</h5> +<ol> +<li> +<p>(except weekends) Take the S-Bahn S8 line in the direction of (Hauptbahnhof) Munich Central Station until the third stop, Ismaning (approx. 13 minutes). From there, take Bus Nr. 230 to the MI-Building stop on the Garching Campus. Alternatively: take the S1 line until Neufahrn, then Bus 690, which stops at Boltzmannstraße.</p> +</li> +<li> +<p>Take S-Bahn lines S8 or S1 towards the city center until the Marienplatz stop. Then change to the U-Bahn U6 line towards Garching-Forschungszentrum and exit at the last station. Take the south exit to the MI-Building and LRZ.</p> +</li> +<li> +<p>Taxi: the fare is ca. 30-40 euros.</p> +</li> +</ol> +<p>For cases 1 and 2, before the trip get the one-day Munich Airport ticket and validate it. It will cover all public transportation for that day.</p> +<h5 id="getting-to-the-tum-campus-from-garching-u-bahn">Getting to the TUM Campus from Garching: U-Bahn</h5> +<p>The city of Garching is located on the U6 line, one stop before Garching-Forschungszentrum. To get from Garching to Garching-Forschungszentrum with the U-Bahn, a special one-way ticket called Kurzstrecke (1.30 euros) can be purchased.</p> +<p><strong>Finding LRZ@TUM</strong></p> +<p><a href="http://www.openstreetmap.org/?mlat=48.2615702464&amp;mlon=11.6686558264&amp;zoom=32">OpenStreetMap link</a></p> +<p><a href="https://maps.google.com/maps?q=48.2615702464,11.6686558264&amp;spn=0.005,0.005&amp;t=k">Google Maps link</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687268.gif" alt=""></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/second-tuc-meeting/attachments/2523698/2687269.gif" alt=""></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying: Munich</strong> airport is located 28.5 km northeast of Munich. 
There are two ways to get from the airport to the city center: suburban train (S-Bahn) and taxi.</p> +<p><strong>S-Bahn:</strong> S-Bahn lines S1 and S8 will get you from the Munich airport to the city center, stopping at both Munich Central Station (Hauptbahnhof) and Marienplatz. A one-day Airport-City ticket costs 11.20 euros and is valid for all public transportation in the Munich area during the day of purchase (the ticket needs to be validated before the journey). The S-Bahn leaves every 5-20 minutes and reaches the city center in approx. 40 minutes.</p> +<p><strong>Taxi:</strong> a taxi from the airport to the city center costs approximately 50 euros.</p> +<h4 id="social-dinner">Social Dinner</h4> +<p>The social dinner will take place at 7 pm on April 22 in Hofbräuhaus (second floor).</p> +<p>Address: Hofbräuhaus, Platzl 9, Munich</p> + + + + + First TUC Meeting + https://ldbcouncil.org/event/first-tuc-meeting/ + Mon, 19 Nov 2012 09:00:00 +0100 + + https://ldbcouncil.org/event/first-tuc-meeting/ + <p>The LDBC consortium are pleased to announce the first Technical User Community (TUC) meeting. This will be a two-day event in Barcelona on the <strong>19/20th November 2012</strong>.</p> +<p>So far more than six commercial consumers of graph/RDF database technology have expressed an interest in attending the event, and more are welcome. The proposed format of the event will include:</p> +<ul> +<li>Introduction by the coordinator and technical director explaining the objectives of the LDBC project</li> +<li>Invitation to users to explain their use-cases and describe the limitations they have found in current technology</li> +<li>Brain-storming session for identifying trends and mapping out strategies to tackle existing choke-points</li> +</ul> +<p>The exact agenda will be published here as things get finalised before the event.</p> +<p>All users of RDF and graph databases are welcome to attend. If you are interested, please contact: ldbc AT ac DOT upc DOT edu</p> +<ul> +<li><a href="#agenda">Agenda</a></li> +<li><a href="#slide">Slide</a> +<ul> +<li><a href="#logistics">Logistics</a> +<ul> +<li><a href="#date">Date</a></li> +<li><a href="#location">Location</a></li> +</ul> +</li> +<li><a href="#venue">Venue</a></li> +<li><a href="#getting-there">Getting there</a></li> +</ul> +</li> +</ul> +<h3 id="agenda">Agenda</h3> +<p>We will start at 9:00 on Monday for a full day, followed by half a day on Tuesday to allow attendees to travel home on the evening of the 20th.</p> +<p><strong>Day 1</strong></p> +<p>09:00 Welcome (Location: Aula Master)<br> +09:30 Project overview (Emphasis on task forces?) 
+ Questionnaire results?<br> +10:30 Coffee break<br> +11:00 User talks (To gather information for use cases?)</p> +<p>13:00 Lunch</p> +<p>14:00 User talks (cont.)<br> +15:00 Use case discussions (based on questionnaire results + consortium proposal + user talks).<br> +16:00 Task force proposals (consortium)<br> +17:00 Finish first day</p> +<p>20:00 Social dinner</p> +<p><strong>Day 2</strong></p> +<p>10:00 Task force discussion (consortium + TUC)<br> +11:00 Coffe break<br> +11:30 Task force discussion (consortium + TUC)<br> +12:30 Summaries (Task forces, use cases, &hellip;) and actions</p> +<p>13:00 Lunch and farewell</p> +<p>15:00 LDBC Internal meeting</p> +<h3 id="slide">Slide</h3> +<p>Opening session:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686995.pptx">CWI – Peter Boncz</a> – Objectives</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687001.pdf">UPC – Larri</a> – Questionnaire</li> +</ul> +<p>User stories:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686998.pdf">BBC – Jem Rayfield</a></li> +<li>CA Technologies – Victor Muntés</li> +<li>Connected Discovery (Open Phacts) – Bryn Williams-Jones</li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687003.pptx">Elsevier – Alan Yagoda</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687000.pptx">ERA7 Bioinformatics – Eduardo Pareja</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687005.pptx">Press Association – Jarred McGinnis</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687004.pptx">RJLee – David Neuer</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686994.pdf">Yale – Lec Maj</a></li> +</ul> +<p>Benchmark proposals:</p> +<ul> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2686991.pdf">Publishing benchmark proposal – Ontotext – Barry Bishop</a></li> +<li><a href="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/2687002.pdf">Social Network Benchmark Proposal – UPC – Larri</a></li> +</ul> +<h4 id="logistics">Logistics</h4> +<h5 id="date">Date</h5> +<p>19th and 20th November 2012</p> +<h5 id="location">Location</h5> +<p>The TUC meeting will be held at “Aula Master” at A3 building located inside the “Campus Nord de la UPC” in Barcelona. The address is:</p> +<p>Aula Master<br> +Edifici A3, Campus Nord UPC<br> +C. 
Jordi Girona, 1-3<br> +08034 Barcelona, Spain</p> +<h4 id="venue">Venue</h4> +<p>To reach the campus, there are several options, including Taxi, <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=c8996f6c-8ad5-4d21-b59b-faf9fceebd80&amp;groupId=10168">Metro</a> and <a href="http://www.tmb.cat/ca/c/document_library/get_file?uuid=5e6af5e2-7677-4ce8-85bb-8e63f2b086f1&amp;groupId=10168">Bus</a>.</p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933315.jpg" alt=""></p> +<p><strong>Finding UPC</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933318.jpg" alt=""></p> +<p><strong>Finding the meeting room</strong></p> +<h4 id="getting-there">Getting there</h4> +<p><strong>Flying:</strong> Barcelona airport is situated 12 km from the city. There are several ways of getting from the airport to the centre of Barcelona, the cheapest of which is to take the train located outside just a few minutes walking distance past the parking lots at terminal 2 (there is a free bus between terminal 1 and terminal 2, see this <a href="http://goo.gl/maps/iJqlj">map of the airport</a>). It is possible to buy 10 packs of train tickets which makes it cheaper. Taking the bus to the centre of town is more convenient as they leave directly from terminal 1 and 2, however it is more expensive than the train.</p> +<p><strong>Rail:</strong> The Renfe commuter train leaves the airport every 30 minutes from 6.13 a.m. to 11.40 p.m. Tickets cost around 3€ and the journey to the centre of Barcelona (Sants or Plaça Catalunya stations) takes 20 minutes.</p> +<p><strong>Bus:</strong> The Aerobus leaves the airport every 12 minutes, from 6.00 a.m. to 24.00, Monday to Friday, and from 6.30 a.m. to 24.00 on Saturdays, Sundays and public holidays. Tickets cost 6€ and the journey ends in Plaça Catalunya in the centre of Barcelona.</p> +<p><strong>Taxi:</strong> From the airport, you can take one of Barcelona&rsquo;s typical black and yellow taxis. Taxis may not take more than four passengers. Unoccupied taxis display a green light and have a clearly visible sign showing LIBRE or LLIURE. The trip to Sants train station costs approximately €16 and trips to other destinations in the city cost approximately €18.</p> +<p><strong>Train and bus:</strong> Barcelona has two international train stations: Sants and França. Bus companies have different points of arrival in different parts of the city. 
You can find detailed information in the following link: <a href="http://www.barcelona-airport.com/eng/transport_eng.htm">http://www.barcelona-airport.com/eng/transport_eng.htm</a></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933316.jpg" alt=""></p> +<p><strong>The locations of the airport and the city centre</strong></p> +<p><img src="https://pub-383410a98aef4cb686f0c7601eddd25f.r2.dev/event/first-tuc-meeting/attachments/1671180/1933317.jpg" alt=""></p> +<p><strong>Bus map</strong></p> + + + + + \ No newline at end of file diff --git a/jan-2-2006/page/1/index.html b/jan-2-2006/page/1/index.html new file mode 100644 index 00000000..718d713b --- /dev/null +++ b/jan-2-2006/page/1/index.html @@ -0,0 +1,10 @@ + + + + https://ldbcouncil.org/jan-2-2006/ + + + + + + diff --git a/jan-2-2006/page/2/index.html b/jan-2-2006/page/2/index.html new file mode 100644 index 00000000..4383f729 --- /dev/null +++ b/jan-2-2006/page/2/index.html @@ -0,0 +1,804 @@ + + + + + Jan 2, 2006 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Jan 2, 2006

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+ +
+ +

We are delighted to announce the set up of the Financial Benchmark (FinBench) task force.

+

The Financial Benchmark (FinBench) project aims to define a benchmark for evaluating graph databases and to develop a data generation process and a query driver that make the evaluation of graph databases representative, reliable and comparable, especially in financial scenarios such as anti-fraud and risk control. The FinBench is scheduled to be released in the …

+ +
+
+ +
+ + +
+
+
+ +

Speeding Up LDBC SNB Datagen

+
Tags:
+ DATAGEN + , SNB + +
+
+ +

LDBC’s Social Network Benchmark [4] (LDBC SNB) is an industrial and academic initiative, formed by principal actors in the field of graph-like data management. Its goal is to define a framework in which different graph-based technologies can be fairly tested and compared, which can drive the identification of systems’ bottlenecks and required functionalities, and can help researchers open new frontiers in high-performance graph data …

+ +
+
+ +
+ + + + + +
+
+
+ +

LDBC and Apache Flink

+
Tags:
+ FLINK + , DATAGEN + , SNB + +
+
+ +

Apache Flink [1] is an open source platform for distributed stream and batch data processing. Flink’s core is a streaming dataflow engine that provides data distribution, communication, and fault tolerance for distributed computations over data streams. Flink also builds batch processing on top of the streaming engine, overlaying native iteration support, managed memory, and program optimization.

+

+

Flink offers multiple APIs to process data …

+ +
+
+ +
+ + +
+
+
+ +

Elements of Instance Matching Benchmarks: a Short Overview

+
Tags:
+ INSTANCE MATCHING + , SPB + +
+
+ +

The number of datasets published in the Web of Data as part of the Linked Data Cloud is constantly increasing. The Linked Data paradigm is based on the unconstrained publication of information by different publishers, and the interlinking of web resources through “same-as” links which specify that two URIs correspond to the same real world object. In the vast number of data sources participating in the Linked Data Cloud, this information is not …

+ +
+
+ +
+ + +
+
+ +
+ +

In this post we will look at running the LDBC SNB on Virtuoso.

+

First, let’s recap what the benchmark is about:

+
    +
  1. +

    fairly frequent short updates, with no update contention worth mentioning

    +
  2. +
  3. +

    short random lookups

    +
  4. +
  5. +

    medium complex queries centered around a person’s social environment

    +
  6. +
+

The updates exist so as to invalidate strategies that rely too heavily on precomputation. The short lookups exist for the sake of realism; after all, an …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/jan-2-2006/page/3/index.html b/jan-2-2006/page/3/index.html new file mode 100644 index 00000000..5c0c14dc --- /dev/null +++ b/jan-2-2006/page/3/index.html @@ -0,0 +1,796 @@ + + + + + Jan 2, 2006 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Jan 2, 2006

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

SNB and Graphs Related Presentations at GRADES '15

+
Tags:
+ SIGMOD + , GRAPHALYTICS + , GRADES + , SNB + , DATAGEN + , WORKSHOP + +
+
+ +

This coming 31st of May, the GRADES workshop will take place in Melbourne, co-located with the ACM SIGMOD/PODS conference. GRADES started as an initiative of the Linked Data Benchmark Council at SIGMOD/PODS 2013, held in New York.

+

Among the papers published in this edition we have “Graphalytics: A Big Data Benchmark for Graph-Processing Platforms”, which presents a new benchmark that uses the Social Network Benchmark data generator of LDBC (that can …

+ +
+
+ +
+ + +
+
+
+ +

SNB Interactive Part 2: Modeling Choices

+
Tags:
+ SNB + , VIRTUOSO + , INTERACTIVE + +
+
+ +

​SNB Interactive is the wild frontier, with very few rules. This is necessary, among other reasons, because there is no standard property graph data model, and because the contestants support a broad mix of programming models, ranging from in-process APIs to declarative query.

+

In the case of Virtuoso, we have played with SQL and SPARQL implementations. For a fixed schema and well known workload, SQL will always win. The reason for this is that …

+ +
+
+ +
+ + +
+
+
+ +

LDBC Participates in the 36th Edition of the ACM SIGMOD/PODS Conference

+
Tags:
+ SIGMOD + , GRADES + , SNB + , GRAPHALYTICS + , WORKSHOP + +
+
+ +

LDBC is presenting two papers at the next edition of the ACM SIGMOD/PODS conference held in Melbourne from May 31st to June 4th, 2015. The annual ACM SIGMOD/PODS conference is a leading international forum for database researchers, practitioners, developers, and users to explore cutting-edge ideas and results, and to exchange techniques, tools and experiences.

+

On the industry track, LDBC will be presenting the Social Network Benchmark Interactive …

+ +
+
+ +
+ + +
+
+
+ +

SNB Interactive Part 1: What Is SNB Interactive Really About?

+
Tags:
+ SNB + , VIRTUOSO + , INTERACTIVE + +
+
+ +

This post is the first in a series of blogs analyzing the LDBC Social Network Benchmark Interactive workload. This is written from the dual perspective of participating in the benchmark design and of building the OpenLink Virtuoso implementation of same.

+

With two implementations of SNB interactive at four different scales, we can take a first look at what the benchmark is really about. The hallmark of a benchmark implementation is that its …

+ +
+
+ +
+ + +
+
+
+ +

Why Do We Need an LDBC SNB-Specific Workload Driver?

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

In a previous 3-part blog series we touched upon the difficulties of executing the LDBC SNB Interactive (SNB) workload, while achieving good performance and scalability. What we didn’t discuss is why these difficulties were unique to SNB, and what aspects of the way we perform workload execution are scientific contributions - novel solutions to previously unsolved problems. This post will highlight the differences between SNB and more …

+ +
+
+ +
+ + +
+
+
+ +

Event Driven Post Generation in Datagen

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

As discussed in previous posts, one of the features that makes Datagen more realistic is the fact that the activity volume of the simulated Persons is not uniform, but forms spikes. In this blog entry I want to explain more in depth how this is actually implemented inside of the generator.

+

First of all, I start with a few basics of how Datagen works internally. In Datagen, once the person graph has been created (persons and their relationships), …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/jan-2-2006/page/4/index.html b/jan-2-2006/page/4/index.html new file mode 100644 index 00000000..8c64666b --- /dev/null +++ b/jan-2-2006/page/4/index.html @@ -0,0 +1,768 @@ + + + + + Jan 2, 2006 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Jan 2, 2006

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

The LDBC Datagen Community Structure

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

This blog entry is about one of the features of DATAGEN that makes it different from other synthetic graph generators that can be found in the literature: the community structure of the graph.

+

When generating synthetic graphs, one must not only pay attention to quantitative measures such as the number of nodes and edges, but also to other, more qualitative characteristics such as the degree distribution and the clustering coefficient. Real graphs, and …

+ +
+
+ +
+ + +
+
+
+ +

Industry Relevance of the Semantic Publishing Benchmark

+
Tags:
+ INDUSTRY + , SPB + +
+
+ + + post/industry-relevance-of-the-semantic-publishing-benchmark/01_sf_newspapers.png +
+ +
+ +

Publishing and media businesses are going through transformation

+

I took this picture in June 2010 next to Union Square in San Francisco. I was smoking and …

+ +
+
+ +
+ + +
+
+
+ +

OWL-Empowered SPARQL Query Optimization

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

The Linked Data paradigm has become the prominent enabler for sharing huge volumes of data using Semantic Web technologies, and has created novel challenges for non-relational data management systems, such as RDF and graph engines. Efficient data access through queries is perhaps the most important data management task, and is enabled through query optimization techniques, which amount to the discovery of optimal or close to optimal execution …

+ +
+
+ +
+ + +
+
+
+ +

Person Activity Subgraph Features in LDBC DATAGEN

+
Tags:
+ SNB + , DATAGEN + +
+
+ +

When talking about DATAGEN and other graph generators with social network characteristics, our attention is typically drawn to the friendship subgraph and/or its structure. However, a social graph is more than a bunch of people connected by friendship relations; it has a lot of other things worth looking at. With a quick look at commercial social networks like Facebook, Twitter or Google+, one can easily identify a lot of other …

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 2: Tracking Dependencies Between Queries

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

The SNB Driver part 1 post introduced, broadly, the challenges faced when developing a workload driver for the LDBC SNB benchmark. In this blog we’ll drill down deeper into the details of what it means to execute “dependent queries” during benchmark execution, and how this is handled in the driver. First of all, as many driver-specific terms will be used, below is a listing of their definitions. There is no need to read them in …

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 3: Workload Execution Putting It All Together

+
Tags:
+ SNB + , DRIVER + , INTERACTIVE + +
+
+ +

Up until now we have introduced the challenges faced when executing the LDBC SNB benchmark, as well as explained how some of these are overcome. With the foundations laid, we can now explain precisely how operations are executed.

+

Based on the dependencies certain operations have, and on the granularity of parallelism we wish to achieve while executing them, we assign a Dependency Mode and an Execution Mode to every operation type. Using these …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/jan-2-2006/page/5/index.html b/jan-2-2006/page/5/index.html new file mode 100644 index 00000000..dbe3d0b9 --- /dev/null +++ b/jan-2-2006/page/5/index.html @@ -0,0 +1,768 @@ + + + + + Jan 2, 2006 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Jan 2, 2006

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Running the Semantic Publishing Benchmark on Sesame, a Step by Step Guide

+
Tags:
+ SPB + , SESAME + , RDF + , TUTORIAL + , GUIDE + +
+
+ +

Until now we have discussed several aspects of the Semantic Publishing Benchmark (SPB), such as the difference in performance between virtual and real server configurations, how to choose an appropriate query mix for a benchmark run, and our experience with using SPB in the development process of GraphDB for finding performance issues.

+

In this post we provide a step-by-step guide on how to run SPB using the Sesame RDF data store on a fresh install …

+ +
+
+ +
+ + +
+
+
+ +

Semantic Publishing Instance Matching Benchmark

+
Tags:
+ INSTANCE MATCHING + , BENCHMARK + +
+
+ +

The Semantic Publishing Instance Matching Benchmark (SPIMBench) is a novel benchmark for the assessment of instance matching techniques for RDF data with an associated schema. SPIMBench extends the state-of-the-art instance matching benchmarks for RDF data in three main aspects: it allows for systematic scalability testing, supports a wider range of test cases including semantics-aware ones, and provides an enriched gold standard.

+

The SPIMBench …

+ +
+
+ +
+ + +
+
+
+ +

Further Developments in SNB BI Workload

+
Tags:
+ SNB + , BI + +
+
+ +

We are presently working on the SNB BI workload. Andrey Gubichev of TU Munchen and myself are going through the queries and are playing with two SQL based implementations, one on Virtuoso and the other on Hyper.

+

As discussed before, the BI workload has the same choke points as TPC-H as a base but pushes further in terms of graphiness and query complexity.

+

There are obvious marketing applications for a SNB-like dataset. There are also security …

+ +
+
+ +
+ + +
+
+
+ +

Sizing AWS Instances for the Semantic Publishing Benchmark

+
Tags:
+ SPB + , AMAZON + , EC2 + , AWS + , RDF + +
+
+ +

LDBC’s Semantic Publishing Benchmark (SPB) measures the performance of an RDF database in a load typical for metadata-based content publishing, such as the famous BBC Dynamic Semantic Publishing scenario. Such load combines tens of updates per second (e.g. adding metadata about new articles) with even higher volume of read requests (SPARQL queries collecting recent content and data to generate web page on a specific subject, e.g. Frank …

+ +
+
+ +
+ + +
+
+
+ +

DATAGEN: a Realistic Social Network Data Generator

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

In previous posts (Getting started with snb, DATAGEN: data generation for the Social Network Benchmark), Arnau Prat discussed the main features and characteristics of DATAGEN: realism, scalability, determinism, usability. DATAGEN is the social network data generator used by the three LDBC-SNB workloads, which produces data simulating the activity in a social network site during a period of time. In this post, we conduct a series of experiments …

+ +
+
+ +
+ + +
+
+
+ +

SNB Driver - Part 1

+
Tags:
+ SNB + , DRIVER + , TPC-C + , INTERACTIVE + +
+
+ +

In this multi-part blog we consider the challenge of running the LDBC Social Network Interactive Benchmark (LDBC SNB) workload in parallel, i.e. the design of the workload driver that will issue the queries against the System Under Test (SUT). We go through design principles that were implemented for the LDBC SNB workload generator/load tester (simply referred to as driver). Software and documentation for this driver is available here: …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/jan-2-2006/page/6/index.html b/jan-2-2006/page/6/index.html new file mode 100644 index 00000000..1348ec5e --- /dev/null +++ b/jan-2-2006/page/6/index.html @@ -0,0 +1,776 @@ + + + + + Jan 2, 2006 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Jan 2, 2006

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

Making Semantic Publishing Execution Rules

+
Tags:
+ SPB + , TEST RUN + +
+
+ +

LDBC SPB (Semantic Publishing Benchmark) is based on the BBC linked data platform use case. Thus the data modelling and transaction mix reflects the BBC’s actual utilization of RDF. But a benchmark is not only a condensation of current best practices. The BBC linked data platform is an Ontotext Graph DB deployment. Graph DB was formerly known as Owlim.

+

So, in SPB we wanted to address substantially more complex queries than the lookups that …

+ +
+
+ +
+ + +
+
+ +
+ +

The Semantic Publishing Benchmark (SPB), developed in the context of LDBC, aims at measuring the read and write operations that can be performed in the context of a media organisation. It simulates the management and consumption of RDF metadata describing media assets and creative works. The scenario is based around a media organisation that maintains RDF descriptions of its catalogue of creative works. These descriptions use a set of ontologies …

+ +
+
+ +
+ + +
+
+
+ +

Choke Point Based Benchmark Design

+
Tags:
+ DATABASE + , BENCHMARK + , DESIGN + +
+
+ +

The Linked Data Benchmark Council (LDBC) mission is to design and maintain benchmarks for graph data management systems, to establish and enforce standards for running these benchmarks, and to publish and arbitrate the official benchmark results. The council and its https://ldbcouncil.org website just launched, and in its first 1.5 years of existence, most effort at LDBC has gone into investigating the needs of the field through interaction …

+ +
+
+ +
+ + +
+
+
+ +

New Website Online LDBC Benchmarks Reach Public Draft

+
Tags:
+ DEVELOPER + , INDUSTRY + +
+
+ +

The Linked Data Benchmark Council (LDBC) is reaching a milestone today, June 23, 2014, in announcing that two of the benchmarks it has been developing for the past 1.5 years have now reached the status of Public Draft. This concerns the Semantic Publishing Benchmark (SPB) and the interactive workload of the Social Network Benchmark (SNB). In the case of LDBC, the release is staged: for now, the benchmark software runs only read-only queries. This will be …

+ +
+
+ +
+ + +
+
+
+ +

Social Network Benchmark Goals

+
Tags:
+ SNB + , DATAGEN + , INTERACTIVE + , BI + , GRAPHALYTICS + +
+
+ +

Social Network interaction is amongst the most natural and widely spread activities in the internet society, and it has turned out to be a very useful way for people to socialise at different levels (friendship, professional, hobby, etc.). As such, Social Networks are well understood from the point of view of the data involved and the interaction required by their actors. Thus, the concepts of friends of friends, or retweet are well established …

+ +
+
+ +
+ + +
+
+ +
+ +

It is with great pleasure that we announce the new LDBC organisation site at www.ldbcouncil.org. The LDBC started as a European Community FP7 funded project with the objective to create, foster and become an industry reference for benchmarking RDF and Graph technologies. A period of more than one and a half years has led us to the creation of the first two workloads, the Semantic Publishing Benchmark and the Social Network Benchmark in its …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/jan-2-2006/page/7/index.html b/jan-2-2006/page/7/index.html new file mode 100644 index 00000000..dbf5a926 --- /dev/null +++ b/jan-2-2006/page/7/index.html @@ -0,0 +1,794 @@ + + + + + Jan 2, 2006 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Jan 2, 2006

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

2nd International Workshop on Benchmarking RDF Systems

+
Tags:
+ WORKSHOP + , CFP + , BENCHMARK + , BERSYS + +
+
+ +

Following the 1st International Workshop on Benchmarking RDF Systems (BeRSys 2013), the aim of the BeRSys 2014 workshop is to provide a discussion forum where researchers and industry practitioners can meet to discuss topics related to the performance of RDF systems. BeRSys 2014 is the only workshop dedicated to benchmarking different aspects of RDF engines, in the line of the TPCTC series of workshops. The focus of the workshop is to expose and initiate …

+ +
+
+ +
+ + +
+
+
+ +

DATAGEN: Data Generation for the Social Network Benchmark

+
Tags:
+ DATAGEN + , SOCIAL NETWORK + , SNB + +
+
+ +

As explained in a previous post, the LDBC Social Network Benchmark (LDBC-SNB) has the objective to provide a realistic yet challenging workload, consisting of a social network and a set of queries. Both have to be realistic, easy to understand and easy to generate. This post has the objective to discuss the main features of DATAGEN, the social network data generator provided by LDBC-SNB, which is an evolution of S3G2 [1].

+

One of the most …

+ +
+
+ +
+ + +
+
+
+ +

Getting Started With SNB

+
Tags:
+ SNB + , INTERACTIVE + , DATAGEN + +
+
+ +

In a previous blog post titled “Is SNB like Facebook’s LinkBench?”, Peter Boncz discusses the design philosophy that shapes SNB and how it compares to other existing benchmarks such as LinkBench. In this post, I will briefly introduce the essential parts forming SNB, which are DATAGEN, the LDBC execution driver and the workloads.

+

DATAGEN

+

DATAGEN is the data generator used by all the workloads of SNB. Here we introduced the …

+ +
+
+ +
+ + +
+
+ +
+ +

The LDBC Social Network Benchmark (SNB) is composed of three distinct workloads, interactive, business intelligence and graph analytics. This post introduces the interactive workload.

+

The benchmark measures the speed of queries of medium complexity against a social network that is being constantly updated. The queries are scoped to a user’s social environment and potentially access data associated with the friends of a user and their friends.

+

This …

+ +
+
+ +
+ + +
+
+
+ +

Is SNB Like Facebooks LinkBench

+
Tags:
+ DEVELOPER + , SNB + , INTERACTIVE + , BI + , GRAPHALYTICS + +
+
+ + + post/is-snb-like-facebooks-linkbench/SNB-workloads-vs-systems.jpg +
+ +
+ +

In this post, I will discuss in some detail the rationale and goals of the design of the Social Network Benchmark (SNB) and explain how it relates to real …

+ +
+
+ +
+ + +
+
+
+ +

Making It Interactive

+
Tags:
+ SNB + , BENCHMARKING + , TPC + , SPARQL + , INTERACTIVE + +
+
+ +

Synopsis: Now is the time to finalize the interactive part of the Social Network Benchmark (SNB). The benchmark must be both credible in a real social network setting and pose new challenges. There are many hard queries but not enough representation for what online systems in fact do. So, the workload mix must strike a balance between the practice and presenting new challenges.

+

It is about to be showtime for LDBC. The initial installment of the …

+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/jan-2-2006/page/8/index.html b/jan-2-2006/page/8/index.html new file mode 100644 index 00000000..c3c84c14 --- /dev/null +++ b/jan-2-2006/page/8/index.html @@ -0,0 +1,709 @@ + + + + + Jan 2, 2006 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + +
+ + + + + +
+ + + +
+
+
+
+ + +

Jan 2, 2006

+ + + + +
+
+
+
+ + + + +
+
+
+
+
+ + + +
+
+
+ +

SNB Data Generator - Getting Started

+
Tags:
+ DATAGEN + , SNB + , SOCIAL NETWORK + +
+
+ +

In previous posts (this and this) we briefly introduced the design goals and philosophy behind DATAGEN, the data generator used in LDBC-SNB. In this post, I will explain how to use DATAGEN to generate the necessary datasets to run LDBC-SNB. Of course, as DATAGEN is continuously under development, the instructions given in this tutorial might change in the future.

+

Getting and Configuring Hadoop

+

DATAGEN runs on top of Hadoop 1.2.1 to be scalable. …

+ +
+
+ +
+ + +
+
+
+ +

The Day of Graph Analytics

+
Tags:
+ ANALYTICS + , SNB + +
+
+ +

Note: consider this post as a continuation of the “Making it interactive” post by Orri Erling.

+

I have now completed the Virtuoso TPC-H work, including scale out. Optimization possibilities extend to infinity but the present level is good enough. TPC-H is the classic of all analytics benchmarks and is difficult enough, I have extensive commentary on this on my blog (In Hoc Signo Vinces series), including experimental results. This is, …

+ +
+
+ +
+ + +
+
+
+ +

Using LDBC SPB to Find OWLIM Performance Issues

+
Tags:
+ LDBC + , SPB + , RDF + +
+
+ +

During the past six months we (the OWLIM Team at Ontotext) have integrated the LDBC Semantic Publishing Benchmark (LDBC-SPB) as a part of our development and release process.

+

First thing we’ve started using the LDBC-SPB for is to monitor the performance of our RDF Store when a new release is about to come out.

+

Initially we’ve decided to fix some of the benchmark parameters:

+
    +
  • the dataset size - 50 million triples (LDBC-SPB50) * benchmark warmup …
+ +
+
+ +
+ + +
+ + + + + + + + + + + + + +
+ +
+
+ + + +
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/js/_vendor/bootstrap.bundle.min.js b/js/_vendor/bootstrap.bundle.min.js new file mode 100644 index 00000000..0ded08ee --- /dev/null +++ b/js/_vendor/bootstrap.bundle.min.js @@ -0,0 +1,6 @@ +/*! + * Bootstrap v4.6.0 (https://getbootstrap.com/) + * Copyright 2011-2021 The Bootstrap Authors (https://github.com/twbs/bootstrap/graphs/contributors) + * Licensed under MIT (https://github.com/twbs/bootstrap/blob/main/LICENSE) + */ +!function(t,e){"object"==typeof exports&&"undefined"!=typeof module?e(exports,require("jquery")):"function"==typeof define&&define.amd?define(["exports","jquery"],e):e((t="undefined"!=typeof globalThis?globalThis:t||self).bootstrap={},t.jQuery)}(this,(function(t,e){"use strict";function n(t){return t&&"object"==typeof t&&"default"in t?t:{default:t}}var i=n(e);function o(t,e){for(var n=0;n=4)throw new Error("Bootstrap's JavaScript requires at least jQuery v1.9.1 but less than v4.0.0")}};l.jQueryDetection(),i.default.fn.emulateTransitionEnd=s,i.default.event.special[l.TRANSITION_END]={bindType:"transitionend",delegateType:"transitionend",handle:function(t){if(i.default(t.target).is(this))return t.handleObj.handler.apply(this,arguments)}};var u="alert",f=i.default.fn[u],d=function(){function t(t){this._element=t}var e=t.prototype;return e.close=function(t){var e=this._element;t&&(e=this._getRootElement(t)),this._triggerCloseEvent(e).isDefaultPrevented()||this._removeElement(e)},e.dispose=function(){i.default.removeData(this._element,"bs.alert"),this._element=null},e._getRootElement=function(t){var e=l.getSelectorFromElement(t),n=!1;return e&&(n=document.querySelector(e)),n||(n=i.default(t).closest(".alert")[0]),n},e._triggerCloseEvent=function(t){var e=i.default.Event("close.bs.alert");return i.default(t).trigger(e),e},e._removeElement=function(t){var e=this;if(i.default(t).removeClass("show"),i.default(t).hasClass("fade")){var n=l.getTransitionDurationFromElement(t);i.default(t).one(l.TRANSITION_END,(function(n){return e._destroyElement(t,n)})).emulateTransitionEnd(n)}else this._destroyElement(t)},e._destroyElement=function(t){i.default(t).detach().trigger("closed.bs.alert").remove()},t._jQueryInterface=function(e){return this.each((function(){var n=i.default(this),o=n.data("bs.alert");o||(o=new t(this),n.data("bs.alert",o)),"close"===e&&o[e](this)}))},t._handleDismiss=function(t){return function(e){e&&e.preventDefault(),t.close(this)}},r(t,null,[{key:"VERSION",get:function(){return"4.6.0"}}]),t}();i.default(document).on("click.bs.alert.data-api",'[data-dismiss="alert"]',d._handleDismiss(new d)),i.default.fn[u]=d._jQueryInterface,i.default.fn[u].Constructor=d,i.default.fn[u].noConflict=function(){return i.default.fn[u]=f,d._jQueryInterface};var c=i.default.fn.button,h=function(){function t(t){this._element=t,this.shouldAvoidTriggerChange=!1}var e=t.prototype;return e.toggle=function(){var t=!0,e=!0,n=i.default(this._element).closest('[data-toggle="buttons"]')[0];if(n){var o=this._element.querySelector('input:not([type="hidden"])');if(o){if("radio"===o.type)if(o.checked&&this._element.classList.contains("active"))t=!1;else{var 
r=n.querySelector(".active");r&&i.default(r).removeClass("active")}t&&("checkbox"!==o.type&&"radio"!==o.type||(o.checked=!this._element.classList.contains("active")),this.shouldAvoidTriggerChange||i.default(o).trigger("change")),o.focus(),e=!1}}this._element.hasAttribute("disabled")||this._element.classList.contains("disabled")||(e&&this._element.setAttribute("aria-pressed",!this._element.classList.contains("active")),t&&i.default(this._element).toggleClass("active"))},e.dispose=function(){i.default.removeData(this._element,"bs.button"),this._element=null},t._jQueryInterface=function(e,n){return this.each((function(){var o=i.default(this),r=o.data("bs.button");r||(r=new t(this),o.data("bs.button",r)),r.shouldAvoidTriggerChange=n,"toggle"===e&&r[e]()}))},r(t,null,[{key:"VERSION",get:function(){return"4.6.0"}}]),t}();i.default(document).on("click.bs.button.data-api",'[data-toggle^="button"]',(function(t){var e=t.target,n=e;if(i.default(e).hasClass("btn")||(e=i.default(e).closest(".btn")[0]),!e||e.hasAttribute("disabled")||e.classList.contains("disabled"))t.preventDefault();else{var o=e.querySelector('input:not([type="hidden"])');if(o&&(o.hasAttribute("disabled")||o.classList.contains("disabled")))return void t.preventDefault();"INPUT"!==n.tagName&&"LABEL"===e.tagName||h._jQueryInterface.call(i.default(e),"toggle","INPUT"===n.tagName)}})).on("focus.bs.button.data-api blur.bs.button.data-api",'[data-toggle^="button"]',(function(t){var e=i.default(t.target).closest(".btn")[0];i.default(e).toggleClass("focus",/^focus(in)?$/.test(t.type))})),i.default(window).on("load.bs.button.data-api",(function(){for(var t=[].slice.call(document.querySelectorAll('[data-toggle="buttons"] .btn')),e=0,n=t.length;e0,this._pointerEvent=Boolean(window.PointerEvent||window.MSPointerEvent),this._addEventListeners()}var e=t.prototype;return e.next=function(){this._isSliding||this._slide("next")},e.nextWhenVisible=function(){var t=i.default(this._element);!document.hidden&&t.is(":visible")&&"hidden"!==t.css("visibility")&&this.next()},e.prev=function(){this._isSliding||this._slide("prev")},e.pause=function(t){t||(this._isPaused=!0),this._element.querySelector(".carousel-item-next, .carousel-item-prev")&&(l.triggerTransitionEnd(this._element),this.cycle(!0)),clearInterval(this._interval),this._interval=null},e.cycle=function(t){t||(this._isPaused=!1),this._interval&&(clearInterval(this._interval),this._interval=null),this._config.interval&&!this._isPaused&&(this._updateInterval(),this._interval=setInterval((document.visibilityState?this.nextWhenVisible:this.next).bind(this),this._config.interval))},e.to=function(t){var e=this;this._activeElement=this._element.querySelector(".active.carousel-item");var n=this._getItemIndex(this._activeElement);if(!(t>this._items.length-1||t<0))if(this._isSliding)i.default(this._element).one("slid.bs.carousel",(function(){return e.to(t)}));else{if(n===t)return this.pause(),void this.cycle();var o=t>n?"next":"prev";this._slide(o,this._items[t])}},e.dispose=function(){i.default(this._element).off(m),i.default.removeData(this._element,"bs.carousel"),this._items=null,this._config=null,this._element=null,this._interval=null,this._isPaused=null,this._isSliding=null,this._activeElement=null,this._indicatorsElement=null},e._getConfig=function(t){return t=a({},v,t),l.typeCheckConfig(p,t,_),t},e._handleSwipe=function(){var t=Math.abs(this.touchDeltaX);if(!(t<=40)){var e=t/this.touchDeltaX;this.touchDeltaX=0,e>0&&this.prev(),e<0&&this.next()}},e._addEventListeners=function(){var 
t=this;this._config.keyboard&&i.default(this._element).on("keydown.bs.carousel",(function(e){return t._keydown(e)})),"hover"===this._config.pause&&i.default(this._element).on("mouseenter.bs.carousel",(function(e){return t.pause(e)})).on("mouseleave.bs.carousel",(function(e){return t.cycle(e)})),this._config.touch&&this._addTouchEventListeners()},e._addTouchEventListeners=function(){var t=this;if(this._touchSupported){var e=function(e){t._pointerEvent&&b[e.originalEvent.pointerType.toUpperCase()]?t.touchStartX=e.originalEvent.clientX:t._pointerEvent||(t.touchStartX=e.originalEvent.touches[0].clientX)},n=function(e){t._pointerEvent&&b[e.originalEvent.pointerType.toUpperCase()]&&(t.touchDeltaX=e.originalEvent.clientX-t.touchStartX),t._handleSwipe(),"hover"===t._config.pause&&(t.pause(),t.touchTimeout&&clearTimeout(t.touchTimeout),t.touchTimeout=setTimeout((function(e){return t.cycle(e)}),500+t._config.interval))};i.default(this._element.querySelectorAll(".carousel-item img")).on("dragstart.bs.carousel",(function(t){return t.preventDefault()})),this._pointerEvent?(i.default(this._element).on("pointerdown.bs.carousel",(function(t){return e(t)})),i.default(this._element).on("pointerup.bs.carousel",(function(t){return n(t)})),this._element.classList.add("pointer-event")):(i.default(this._element).on("touchstart.bs.carousel",(function(t){return e(t)})),i.default(this._element).on("touchmove.bs.carousel",(function(e){return function(e){e.originalEvent.touches&&e.originalEvent.touches.length>1?t.touchDeltaX=0:t.touchDeltaX=e.originalEvent.touches[0].clientX-t.touchStartX}(e)})),i.default(this._element).on("touchend.bs.carousel",(function(t){return n(t)})))}},e._keydown=function(t){if(!/input|textarea/i.test(t.target.tagName))switch(t.which){case 37:t.preventDefault(),this.prev();break;case 39:t.preventDefault(),this.next()}},e._getItemIndex=function(t){return this._items=t&&t.parentNode?[].slice.call(t.parentNode.querySelectorAll(".carousel-item")):[],this._items.indexOf(t)},e._getItemByDirection=function(t,e){var n="next"===t,i="prev"===t,o=this._getItemIndex(e),r=this._items.length-1;if((i&&0===o||n&&o===r)&&!this._config.wrap)return e;var a=(o+("prev"===t?-1:1))%this._items.length;return-1===a?this._items[this._items.length-1]:this._items[a]},e._triggerSlideEvent=function(t,e){var n=this._getItemIndex(t),o=this._getItemIndex(this._element.querySelector(".active.carousel-item")),r=i.default.Event("slide.bs.carousel",{relatedTarget:t,direction:e,from:o,to:n});return i.default(this._element).trigger(r),r},e._setActiveIndicatorElement=function(t){if(this._indicatorsElement){var e=[].slice.call(this._indicatorsElement.querySelectorAll(".active"));i.default(e).removeClass("active");var n=this._indicatorsElement.children[this._getItemIndex(t)];n&&i.default(n).addClass("active")}},e._updateInterval=function(){var t=this._activeElement||this._element.querySelector(".active.carousel-item");if(t){var e=parseInt(t.getAttribute("data-interval"),10);e?(this._config.defaultInterval=this._config.defaultInterval||this._config.interval,this._config.interval=e):this._config.interval=this._config.defaultInterval||this._config.interval}},e._slide=function(t,e){var 
n,o,r,a=this,s=this._element.querySelector(".active.carousel-item"),u=this._getItemIndex(s),f=e||s&&this._getItemByDirection(t,s),d=this._getItemIndex(f),c=Boolean(this._interval);if("next"===t?(n="carousel-item-left",o="carousel-item-next",r="left"):(n="carousel-item-right",o="carousel-item-prev",r="right"),f&&i.default(f).hasClass("active"))this._isSliding=!1;else if(!this._triggerSlideEvent(f,r).isDefaultPrevented()&&s&&f){this._isSliding=!0,c&&this.pause(),this._setActiveIndicatorElement(f),this._activeElement=f;var h=i.default.Event("slid.bs.carousel",{relatedTarget:f,direction:r,from:u,to:d});if(i.default(this._element).hasClass("slide")){i.default(f).addClass(o),l.reflow(f),i.default(s).addClass(n),i.default(f).addClass(n);var p=l.getTransitionDurationFromElement(s);i.default(s).one(l.TRANSITION_END,(function(){i.default(f).removeClass(n+" "+o).addClass("active"),i.default(s).removeClass("active "+o+" "+n),a._isSliding=!1,setTimeout((function(){return i.default(a._element).trigger(h)}),0)})).emulateTransitionEnd(p)}else i.default(s).removeClass("active"),i.default(f).addClass("active"),this._isSliding=!1,i.default(this._element).trigger(h);c&&this.cycle()}},t._jQueryInterface=function(e){return this.each((function(){var n=i.default(this).data("bs.carousel"),o=a({},v,i.default(this).data());"object"==typeof e&&(o=a({},o,e));var r="string"==typeof e?e:o.slide;if(n||(n=new t(this,o),i.default(this).data("bs.carousel",n)),"number"==typeof e)n.to(e);else if("string"==typeof r){if("undefined"==typeof n[r])throw new TypeError('No method named "'+r+'"');n[r]()}else o.interval&&o.ride&&(n.pause(),n.cycle())}))},t._dataApiClickHandler=function(e){var n=l.getSelectorFromElement(this);if(n){var o=i.default(n)[0];if(o&&i.default(o).hasClass("carousel")){var r=a({},i.default(o).data(),i.default(this).data()),s=this.getAttribute("data-slide-to");s&&(r.interval=!1),t._jQueryInterface.call(i.default(o),r),s&&i.default(o).data("bs.carousel").to(s),e.preventDefault()}}},r(t,null,[{key:"VERSION",get:function(){return"4.6.0"}},{key:"Default",get:function(){return v}}]),t}();i.default(document).on("click.bs.carousel.data-api","[data-slide], [data-slide-to]",y._dataApiClickHandler),i.default(window).on("load.bs.carousel.data-api",(function(){for(var t=[].slice.call(document.querySelectorAll('[data-ride="carousel"]')),e=0,n=t.length;e0&&(this._selector=a,this._triggerArray.push(r))}this._parent=this._config.parent?this._getParent():null,this._config.parent||this._addAriaAndCollapsedClass(this._element,this._triggerArray),this._config.toggle&&this.toggle()}var e=t.prototype;return e.toggle=function(){i.default(this._element).hasClass("show")?this.hide():this.show()},e.show=function(){var e,n,o=this;if(!this._isTransitioning&&!i.default(this._element).hasClass("show")&&(this._parent&&0===(e=[].slice.call(this._parent.querySelectorAll(".show, .collapsing")).filter((function(t){return"string"==typeof o._config.parent?t.getAttribute("data-parent")===o._config.parent:t.classList.contains("collapse")}))).length&&(e=null),!(e&&(n=i.default(e).not(this._selector).data("bs.collapse"))&&n._isTransitioning))){var r=i.default.Event("show.bs.collapse");if(i.default(this._element).trigger(r),!r.isDefaultPrevented()){e&&(t._jQueryInterface.call(i.default(e).not(this._selector),"hide"),n||i.default(e).data("bs.collapse",null));var 
a=this._getDimension();i.default(this._element).removeClass("collapse").addClass("collapsing"),this._element.style[a]=0,this._triggerArray.length&&i.default(this._triggerArray).removeClass("collapsed").attr("aria-expanded",!0),this.setTransitioning(!0);var s="scroll"+(a[0].toUpperCase()+a.slice(1)),u=l.getTransitionDurationFromElement(this._element);i.default(this._element).one(l.TRANSITION_END,(function(){i.default(o._element).removeClass("collapsing").addClass("collapse show"),o._element.style[a]="",o.setTransitioning(!1),i.default(o._element).trigger("shown.bs.collapse")})).emulateTransitionEnd(u),this._element.style[a]=this._element[s]+"px"}}},e.hide=function(){var t=this;if(!this._isTransitioning&&i.default(this._element).hasClass("show")){var e=i.default.Event("hide.bs.collapse");if(i.default(this._element).trigger(e),!e.isDefaultPrevented()){var n=this._getDimension();this._element.style[n]=this._element.getBoundingClientRect()[n]+"px",l.reflow(this._element),i.default(this._element).addClass("collapsing").removeClass("collapse show");var o=this._triggerArray.length;if(o>0)for(var r=0;r=0)return 1;return 0}();var k=D&&window.Promise?function(t){var e=!1;return function(){e||(e=!0,window.Promise.resolve().then((function(){e=!1,t()})))}}:function(t){var e=!1;return function(){e||(e=!0,setTimeout((function(){e=!1,t()}),N))}};function A(t){return t&&"[object Function]"==={}.toString.call(t)}function I(t,e){if(1!==t.nodeType)return[];var n=t.ownerDocument.defaultView.getComputedStyle(t,null);return e?n[e]:n}function O(t){return"HTML"===t.nodeName?t:t.parentNode||t.host}function x(t){if(!t)return document.body;switch(t.nodeName){case"HTML":case"BODY":return t.ownerDocument.body;case"#document":return t.body}var e=I(t),n=e.overflow,i=e.overflowX,o=e.overflowY;return/(auto|scroll|overlay)/.test(n+o+i)?t:x(O(t))}function j(t){return t&&t.referenceNode?t.referenceNode:t}var L=D&&!(!window.MSInputMethodContext||!document.documentMode),P=D&&/MSIE 10/.test(navigator.userAgent);function F(t){return 11===t?L:10===t?P:L||P}function R(t){if(!t)return document.documentElement;for(var e=F(10)?document.body:null,n=t.offsetParent||null;n===e&&t.nextElementSibling;)n=(t=t.nextElementSibling).offsetParent;var i=n&&n.nodeName;return i&&"BODY"!==i&&"HTML"!==i?-1!==["TH","TD","TABLE"].indexOf(n.nodeName)&&"static"===I(n,"position")?R(n):n:t?t.ownerDocument.documentElement:document.documentElement}function H(t){return null!==t.parentNode?H(t.parentNode):t}function M(t,e){if(!(t&&t.nodeType&&e&&e.nodeType))return document.documentElement;var n=t.compareDocumentPosition(e)&Node.DOCUMENT_POSITION_FOLLOWING,i=n?t:e,o=n?e:t,r=document.createRange();r.setStart(i,0),r.setEnd(o,0);var a,s,l=r.commonAncestorContainer;if(t!==l&&e!==l||i.contains(o))return"BODY"===(s=(a=l).nodeName)||"HTML"!==s&&R(a.firstElementChild)!==a?R(l):l;var u=H(t);return u.host?M(u.host,e):M(t,H(e).host)}function q(t){var e=arguments.length>1&&void 0!==arguments[1]?arguments[1]:"top",n="top"===e?"scrollTop":"scrollLeft",i=t.nodeName;if("BODY"===i||"HTML"===i){var o=t.ownerDocument.documentElement,r=t.ownerDocument.scrollingElement||o;return r[n]}return t[n]}function B(t,e){var n=arguments.length>2&&void 0!==arguments[2]&&arguments[2],i=q(e,"top"),o=q(e,"left"),r=n?-1:1;return t.top+=i*r,t.bottom+=i*r,t.left+=o*r,t.right+=o*r,t}function Q(t,e){var n="x"===e?"Left":"Top",i="Left"===n?"Right":"Bottom";return parseFloat(t["border"+n+"Width"])+parseFloat(t["border"+i+"Width"])}function W(t,e,n,i){return 
Math.max(e["offset"+t],e["scroll"+t],n["client"+t],n["offset"+t],n["scroll"+t],F(10)?parseInt(n["offset"+t])+parseInt(i["margin"+("Height"===t?"Top":"Left")])+parseInt(i["margin"+("Height"===t?"Bottom":"Right")]):0)}function U(t){var e=t.body,n=t.documentElement,i=F(10)&&getComputedStyle(n);return{height:W("Height",e,n,i),width:W("Width",e,n,i)}}var V=function(t,e){if(!(t instanceof e))throw new TypeError("Cannot call a class as a function")},Y=function(){function t(t,e){for(var n=0;n2&&void 0!==arguments[2]&&arguments[2],i=F(10),o="HTML"===e.nodeName,r=G(t),a=G(e),s=x(t),l=I(e),u=parseFloat(l.borderTopWidth),f=parseFloat(l.borderLeftWidth);n&&o&&(a.top=Math.max(a.top,0),a.left=Math.max(a.left,0));var d=K({top:r.top-a.top-u,left:r.left-a.left-f,width:r.width,height:r.height});if(d.marginTop=0,d.marginLeft=0,!i&&o){var c=parseFloat(l.marginTop),h=parseFloat(l.marginLeft);d.top-=u-c,d.bottom-=u-c,d.left-=f-h,d.right-=f-h,d.marginTop=c,d.marginLeft=h}return(i&&!n?e.contains(s):e===s&&"BODY"!==s.nodeName)&&(d=B(d,e)),d}function J(t){var e=arguments.length>1&&void 0!==arguments[1]&&arguments[1],n=t.ownerDocument.documentElement,i=$(t,n),o=Math.max(n.clientWidth,window.innerWidth||0),r=Math.max(n.clientHeight,window.innerHeight||0),a=e?0:q(n),s=e?0:q(n,"left"),l={top:a-i.top+i.marginTop,left:s-i.left+i.marginLeft,width:o,height:r};return K(l)}function Z(t){var e=t.nodeName;if("BODY"===e||"HTML"===e)return!1;if("fixed"===I(t,"position"))return!0;var n=O(t);return!!n&&Z(n)}function tt(t){if(!t||!t.parentElement||F())return document.documentElement;for(var e=t.parentElement;e&&"none"===I(e,"transform");)e=e.parentElement;return e||document.documentElement}function et(t,e,n,i){var o=arguments.length>4&&void 0!==arguments[4]&&arguments[4],r={top:0,left:0},a=o?tt(t):M(t,j(e));if("viewport"===i)r=J(a,o);else{var s=void 0;"scrollParent"===i?"BODY"===(s=x(O(e))).nodeName&&(s=t.ownerDocument.documentElement):s="window"===i?t.ownerDocument.documentElement:i;var l=$(s,a,o);if("HTML"!==s.nodeName||Z(a))r=l;else{var u=U(t.ownerDocument),f=u.height,d=u.width;r.top+=l.top-l.marginTop,r.bottom=f+l.top,r.left+=l.left-l.marginLeft,r.right=d+l.left}}var c="number"==typeof(n=n||0);return r.left+=c?n:n.left||0,r.top+=c?n:n.top||0,r.right-=c?n:n.right||0,r.bottom-=c?n:n.bottom||0,r}function nt(t){return t.width*t.height}function it(t,e,n,i,o){var r=arguments.length>5&&void 0!==arguments[5]?arguments[5]:0;if(-1===t.indexOf("auto"))return t;var a=et(n,i,r,o),s={top:{width:a.width,height:e.top-a.top},right:{width:a.right-e.right,height:a.height},bottom:{width:a.width,height:a.bottom-e.bottom},left:{width:e.left-a.left,height:a.height}},l=Object.keys(s).map((function(t){return X({key:t},s[t],{area:nt(s[t])})})).sort((function(t,e){return e.area-t.area})),u=l.filter((function(t){var e=t.width,i=t.height;return e>=n.clientWidth&&i>=n.clientHeight})),f=u.length>0?u[0].key:l[0].key,d=t.split("-")[1];return f+(d?"-"+d:"")}function ot(t,e,n){var i=arguments.length>3&&void 0!==arguments[3]?arguments[3]:null,o=i?tt(e):M(e,j(n));return $(n,o,i)}function rt(t){var e=t.ownerDocument.defaultView.getComputedStyle(t),n=parseFloat(e.marginTop||0)+parseFloat(e.marginBottom||0),i=parseFloat(e.marginLeft||0)+parseFloat(e.marginRight||0);return{width:t.offsetWidth+i,height:t.offsetHeight+n}}function at(t){var e={left:"right",right:"left",bottom:"top",top:"bottom"};return t.replace(/left|right|bottom|top/g,(function(t){return e[t]}))}function st(t,e,n){n=n.split("-")[0];var 
i=rt(t),o={width:i.width,height:i.height},r=-1!==["right","left"].indexOf(n),a=r?"top":"left",s=r?"left":"top",l=r?"height":"width",u=r?"width":"height";return o[a]=e[a]+e[l]/2-i[l]/2,o[s]=n===s?e[s]-i[u]:e[at(s)],o}function lt(t,e){return Array.prototype.find?t.find(e):t.filter(e)[0]}function ut(t,e,n){return(void 0===n?t:t.slice(0,function(t,e,n){if(Array.prototype.findIndex)return t.findIndex((function(t){return t[e]===n}));var i=lt(t,(function(t){return t[e]===n}));return t.indexOf(i)}(t,"name",n))).forEach((function(t){t.function&&console.warn("`modifier.function` is deprecated, use `modifier.fn`!");var n=t.function||t.fn;t.enabled&&A(n)&&(e.offsets.popper=K(e.offsets.popper),e.offsets.reference=K(e.offsets.reference),e=n(e,t))})),e}function ft(){if(!this.state.isDestroyed){var t={instance:this,styles:{},arrowStyles:{},attributes:{},flipped:!1,offsets:{}};t.offsets.reference=ot(this.state,this.popper,this.reference,this.options.positionFixed),t.placement=it(this.options.placement,t.offsets.reference,this.popper,this.reference,this.options.modifiers.flip.boundariesElement,this.options.modifiers.flip.padding),t.originalPlacement=t.placement,t.positionFixed=this.options.positionFixed,t.offsets.popper=st(this.popper,t.offsets.reference,t.placement),t.offsets.popper.position=this.options.positionFixed?"fixed":"absolute",t=ut(this.modifiers,t),this.state.isCreated?this.options.onUpdate(t):(this.state.isCreated=!0,this.options.onCreate(t))}}function dt(t,e){return t.some((function(t){var n=t.name;return t.enabled&&n===e}))}function ct(t){for(var e=[!1,"ms","Webkit","Moz","O"],n=t.charAt(0).toUpperCase()+t.slice(1),i=0;i1&&void 0!==arguments[1]&&arguments[1],n=Tt.indexOf(t),i=Tt.slice(n+1).concat(Tt.slice(0,n));return e?i.reverse():i}var St="flip",Dt="clockwise",Nt="counterclockwise";function kt(t,e,n,i){var o=[0,0],r=-1!==["right","left"].indexOf(i),a=t.split(/(\+|\-)/).map((function(t){return t.trim()})),s=a.indexOf(lt(a,(function(t){return-1!==t.search(/,|\s/)})));a[s]&&-1===a[s].indexOf(",")&&console.warn("Offsets separated by white space(s) are deprecated, use a comma (,) instead.");var l=/\s*,\s*|\s+/,u=-1!==s?[a.slice(0,s).concat([a[s].split(l)[0]]),[a[s].split(l)[1]].concat(a.slice(s+1))]:[a];return(u=u.map((function(t,i){var o=(1===i?!r:r)?"height":"width",a=!1;return t.reduce((function(t,e){return""===t[t.length-1]&&-1!==["+","-"].indexOf(e)?(t[t.length-1]=e,a=!0,t):a?(t[t.length-1]+=e,a=!1,t):t.concat(e)}),[]).map((function(t){return function(t,e,n,i){var o=t.match(/((?:\-|\+)?\d*\.?\d*)(.*)/),r=+o[1],a=o[2];if(!r)return t;if(0===a.indexOf("%")){var s=void 0;switch(a){case"%p":s=n;break;case"%":case"%r":default:s=i}return K(s)[e]/100*r}if("vh"===a||"vw"===a)return("vh"===a?Math.max(document.documentElement.clientHeight,window.innerHeight||0):Math.max(document.documentElement.clientWidth,window.innerWidth||0))/100*r;return r}(t,o,e,n)}))}))).forEach((function(t,e){t.forEach((function(n,i){_t(n)&&(o[e]+=n*("-"===t[i-1]?-1:1))}))})),o}var At={placement:"bottom",positionFixed:!1,eventsEnabled:!0,removeOnDestroy:!1,onCreate:function(){},onUpdate:function(){},modifiers:{shift:{order:100,enabled:!0,fn:function(t){var e=t.placement,n=e.split("-")[0],i=e.split("-")[1];if(i){var o=t.offsets,r=o.reference,a=o.popper,s=-1!==["bottom","top"].indexOf(n),l=s?"left":"top",u=s?"width":"height",f={start:z({},l,r[l]),end:z({},l,r[l]+r[u]-a[u])};t.offsets.popper=X({},a,f[i])}return t}},offset:{order:200,enabled:!0,fn:function(t,e){var 
n=e.offset,i=t.placement,o=t.offsets,r=o.popper,a=o.reference,s=i.split("-")[0],l=void 0;return l=_t(+n)?[+n,0]:kt(n,r,a,s),"left"===s?(r.top+=l[0],r.left-=l[1]):"right"===s?(r.top+=l[0],r.left+=l[1]):"top"===s?(r.left+=l[0],r.top-=l[1]):"bottom"===s&&(r.left+=l[0],r.top+=l[1]),t.popper=r,t},offset:0},preventOverflow:{order:300,enabled:!0,fn:function(t,e){var n=e.boundariesElement||R(t.instance.popper);t.instance.reference===n&&(n=R(n));var i=ct("transform"),o=t.instance.popper.style,r=o.top,a=o.left,s=o[i];o.top="",o.left="",o[i]="";var l=et(t.instance.popper,t.instance.reference,e.padding,n,t.positionFixed);o.top=r,o.left=a,o[i]=s,e.boundaries=l;var u=e.priority,f=t.offsets.popper,d={primary:function(t){var n=f[t];return f[t]l[t]&&!e.escapeWithReference&&(i=Math.min(f[n],l[t]-("right"===t?f.width:f.height))),z({},n,i)}};return u.forEach((function(t){var e=-1!==["left","top"].indexOf(t)?"primary":"secondary";f=X({},f,d[e](t))})),t.offsets.popper=f,t},priority:["left","right","top","bottom"],padding:5,boundariesElement:"scrollParent"},keepTogether:{order:400,enabled:!0,fn:function(t){var e=t.offsets,n=e.popper,i=e.reference,o=t.placement.split("-")[0],r=Math.floor,a=-1!==["top","bottom"].indexOf(o),s=a?"right":"bottom",l=a?"left":"top",u=a?"width":"height";return n[s]r(i[s])&&(t.offsets.popper[l]=r(i[s])),t}},arrow:{order:500,enabled:!0,fn:function(t,e){var n;if(!wt(t.instance.modifiers,"arrow","keepTogether"))return t;var i=e.element;if("string"==typeof i){if(!(i=t.instance.popper.querySelector(i)))return t}else if(!t.instance.popper.contains(i))return console.warn("WARNING: `arrow.element` must be child of its popper element!"),t;var o=t.placement.split("-")[0],r=t.offsets,a=r.popper,s=r.reference,l=-1!==["left","right"].indexOf(o),u=l?"height":"width",f=l?"Top":"Left",d=f.toLowerCase(),c=l?"left":"top",h=l?"bottom":"right",p=rt(i)[u];s[h]-pa[h]&&(t.offsets.popper[d]+=s[d]+p-a[h]),t.offsets.popper=K(t.offsets.popper);var m=s[d]+s[u]/2-p/2,g=I(t.instance.popper),v=parseFloat(g["margin"+f]),_=parseFloat(g["border"+f+"Width"]),b=m-t.offsets.popper[d]-v-_;return b=Math.max(Math.min(a[u]-p,b),0),t.arrowElement=i,t.offsets.arrow=(z(n={},d,Math.round(b)),z(n,c,""),n),t},element:"[x-arrow]"},flip:{order:600,enabled:!0,fn:function(t,e){if(dt(t.instance.modifiers,"inner"))return t;if(t.flipped&&t.placement===t.originalPlacement)return t;var n=et(t.instance.popper,t.instance.reference,e.padding,e.boundariesElement,t.positionFixed),i=t.placement.split("-")[0],o=at(i),r=t.placement.split("-")[1]||"",a=[];switch(e.behavior){case St:a=[i,o];break;case Dt:a=Ct(i);break;case Nt:a=Ct(i,!0);break;default:a=e.behavior}return a.forEach((function(s,l){if(i!==s||a.length===l+1)return t;i=t.placement.split("-")[0],o=at(i);var 
u=t.offsets.popper,f=t.offsets.reference,d=Math.floor,c="left"===i&&d(u.right)>d(f.left)||"right"===i&&d(u.left)d(f.top)||"bottom"===i&&d(u.top)d(n.right),m=d(u.top)d(n.bottom),v="left"===i&&h||"right"===i&&p||"top"===i&&m||"bottom"===i&&g,_=-1!==["top","bottom"].indexOf(i),b=!!e.flipVariations&&(_&&"start"===r&&h||_&&"end"===r&&p||!_&&"start"===r&&m||!_&&"end"===r&&g),y=!!e.flipVariationsByContent&&(_&&"start"===r&&p||_&&"end"===r&&h||!_&&"start"===r&&g||!_&&"end"===r&&m),w=b||y;(c||v||w)&&(t.flipped=!0,(c||v)&&(i=a[l+1]),w&&(r=function(t){return"end"===t?"start":"start"===t?"end":t}(r)),t.placement=i+(r?"-"+r:""),t.offsets.popper=X({},t.offsets.popper,st(t.instance.popper,t.offsets.reference,t.placement)),t=ut(t.instance.modifiers,t,"flip"))})),t},behavior:"flip",padding:5,boundariesElement:"viewport",flipVariations:!1,flipVariationsByContent:!1},inner:{order:700,enabled:!1,fn:function(t){var e=t.placement,n=e.split("-")[0],i=t.offsets,o=i.popper,r=i.reference,a=-1!==["left","right"].indexOf(n),s=-1===["top","left"].indexOf(n);return o[a?"left":"top"]=r[n]-(s?o[a?"width":"height"]:0),t.placement=at(e),t.offsets.popper=K(o),t}},hide:{order:800,enabled:!0,fn:function(t){if(!wt(t.instance.modifiers,"hide","preventOverflow"))return t;var e=t.offsets.reference,n=lt(t.instance.modifiers,(function(t){return"preventOverflow"===t.name})).boundaries;if(e.bottomn.right||e.top>n.bottom||e.right2&&void 0!==arguments[2]?arguments[2]:{};V(this,t),this.scheduleUpdate=function(){return requestAnimationFrame(i.update)},this.update=k(this.update.bind(this)),this.options=X({},t.Defaults,o),this.state={isDestroyed:!1,isCreated:!1,scrollParents:[]},this.reference=e&&e.jquery?e[0]:e,this.popper=n&&n.jquery?n[0]:n,this.options.modifiers={},Object.keys(X({},t.Defaults.modifiers,o.modifiers)).forEach((function(e){i.options.modifiers[e]=X({},t.Defaults.modifiers[e]||{},o.modifiers?o.modifiers[e]:{})})),this.modifiers=Object.keys(this.options.modifiers).map((function(t){return X({name:t},i.options.modifiers[t])})).sort((function(t,e){return t.order-e.order})),this.modifiers.forEach((function(t){t.enabled&&A(t.onLoad)&&t.onLoad(i.reference,i.popper,i.options,t,i.state)})),this.update();var r=this.options.eventsEnabled;r&&this.enableEventListeners(),this.state.eventsEnabled=r}return Y(t,[{key:"update",value:function(){return ft.call(this)}},{key:"destroy",value:function(){return ht.call(this)}},{key:"enableEventListeners",value:function(){return gt.call(this)}},{key:"disableEventListeners",value:function(){return vt.call(this)}}]),t}();It.Utils=("undefined"!=typeof window?window:global).PopperUtils,It.placements=Et,It.Defaults=At;var Ot="dropdown",xt=i.default.fn[Ot],jt=new RegExp("38|40|27"),Lt={offset:0,flip:!0,boundary:"scrollParent",reference:"toggle",display:"dynamic",popperConfig:null},Pt={offset:"(number|string|function)",flip:"boolean",boundary:"(string|element)",reference:"(string|element)",display:"string",popperConfig:"(null|object)"},Ft=function(){function t(t,e){this._element=t,this._popper=null,this._config=this._getConfig(e),this._menu=this._getMenuElement(),this._inNavbar=this._detectNavbar(),this._addEventListeners()}var e=t.prototype;return e.toggle=function(){if(!this._element.disabled&&!i.default(this._element).hasClass("disabled")){var e=i.default(this._menu).hasClass("show");t._clearMenus(),e||this.show(!0)}},e.show=function(e){if(void 0===e&&(e=!1),!(this._element.disabled||i.default(this._element).hasClass("disabled")||i.default(this._menu).hasClass("show"))){var 
n={relatedTarget:this._element},o=i.default.Event("show.bs.dropdown",n),r=t._getParentFromElement(this._element);if(i.default(r).trigger(o),!o.isDefaultPrevented()){if(!this._inNavbar&&e){if("undefined"==typeof It)throw new TypeError("Bootstrap's dropdowns require Popper (https://popper.js.org)");var a=this._element;"parent"===this._config.reference?a=r:l.isElement(this._config.reference)&&(a=this._config.reference,"undefined"!=typeof this._config.reference.jquery&&(a=this._config.reference[0])),"scrollParent"!==this._config.boundary&&i.default(r).addClass("position-static"),this._popper=new It(a,this._menu,this._getPopperConfig())}"ontouchstart"in document.documentElement&&0===i.default(r).closest(".navbar-nav").length&&i.default(document.body).children().on("mouseover",null,i.default.noop),this._element.focus(),this._element.setAttribute("aria-expanded",!0),i.default(this._menu).toggleClass("show"),i.default(r).toggleClass("show").trigger(i.default.Event("shown.bs.dropdown",n))}}},e.hide=function(){if(!this._element.disabled&&!i.default(this._element).hasClass("disabled")&&i.default(this._menu).hasClass("show")){var e={relatedTarget:this._element},n=i.default.Event("hide.bs.dropdown",e),o=t._getParentFromElement(this._element);i.default(o).trigger(n),n.isDefaultPrevented()||(this._popper&&this._popper.destroy(),i.default(this._menu).toggleClass("show"),i.default(o).toggleClass("show").trigger(i.default.Event("hidden.bs.dropdown",e)))}},e.dispose=function(){i.default.removeData(this._element,"bs.dropdown"),i.default(this._element).off(".bs.dropdown"),this._element=null,this._menu=null,null!==this._popper&&(this._popper.destroy(),this._popper=null)},e.update=function(){this._inNavbar=this._detectNavbar(),null!==this._popper&&this._popper.scheduleUpdate()},e._addEventListeners=function(){var t=this;i.default(this._element).on("click.bs.dropdown",(function(e){e.preventDefault(),e.stopPropagation(),t.toggle()}))},e._getConfig=function(t){return t=a({},this.constructor.Default,i.default(this._element).data(),t),l.typeCheckConfig(Ot,t,this.constructor.DefaultType),t},e._getMenuElement=function(){if(!this._menu){var e=t._getParentFromElement(this._element);e&&(this._menu=e.querySelector(".dropdown-menu"))}return this._menu},e._getPlacement=function(){var t=i.default(this._element.parentNode),e="bottom-start";return t.hasClass("dropup")?e=i.default(this._menu).hasClass("dropdown-menu-right")?"top-end":"top-start":t.hasClass("dropright")?e="right-start":t.hasClass("dropleft")?e="left-start":i.default(this._menu).hasClass("dropdown-menu-right")&&(e="bottom-end"),e},e._detectNavbar=function(){return i.default(this._element).closest(".navbar").length>0},e._getOffset=function(){var t=this,e={};return"function"==typeof this._config.offset?e.fn=function(e){return e.offsets=a({},e.offsets,t._config.offset(e.offsets,t._element)||{}),e}:e.offset=this._config.offset,e},e._getPopperConfig=function(){var t={placement:this._getPlacement(),modifiers:{offset:this._getOffset(),flip:{enabled:this._config.flip},preventOverflow:{boundariesElement:this._config.boundary}}};return"static"===this._config.display&&(t.modifiers.applyStyle={enabled:!1}),a({},t,this._config.popperConfig)},t._jQueryInterface=function(e){return this.each((function(){var n=i.default(this).data("bs.dropdown");if(n||(n=new t(this,"object"==typeof e?e:null),i.default(this).data("bs.dropdown",n)),"string"==typeof e){if("undefined"==typeof n[e])throw new TypeError('No method named 
"'+e+'"');n[e]()}}))},t._clearMenus=function(e){if(!e||3!==e.which&&("keyup"!==e.type||9===e.which))for(var n=[].slice.call(document.querySelectorAll('[data-toggle="dropdown"]')),o=0,r=n.length;o0&&a--,40===e.which&&adocument.documentElement.clientHeight;n||(this._element.style.overflowY="hidden"),this._element.classList.add("modal-static");var o=l.getTransitionDurationFromElement(this._dialog);i.default(this._element).off(l.TRANSITION_END),i.default(this._element).one(l.TRANSITION_END,(function(){t._element.classList.remove("modal-static"),n||i.default(t._element).one(l.TRANSITION_END,(function(){t._element.style.overflowY=""})).emulateTransitionEnd(t._element,o)})).emulateTransitionEnd(o),this._element.focus()}},e._showElement=function(t){var e=this,n=i.default(this._element).hasClass("fade"),o=this._dialog?this._dialog.querySelector(".modal-body"):null;this._element.parentNode&&this._element.parentNode.nodeType===Node.ELEMENT_NODE||document.body.appendChild(this._element),this._element.style.display="block",this._element.removeAttribute("aria-hidden"),this._element.setAttribute("aria-modal",!0),this._element.setAttribute("role","dialog"),i.default(this._dialog).hasClass("modal-dialog-scrollable")&&o?o.scrollTop=0:this._element.scrollTop=0,n&&l.reflow(this._element),i.default(this._element).addClass("show"),this._config.focus&&this._enforceFocus();var r=i.default.Event("shown.bs.modal",{relatedTarget:t}),a=function(){e._config.focus&&e._element.focus(),e._isTransitioning=!1,i.default(e._element).trigger(r)};if(n){var s=l.getTransitionDurationFromElement(this._dialog);i.default(this._dialog).one(l.TRANSITION_END,a).emulateTransitionEnd(s)}else a()},e._enforceFocus=function(){var t=this;i.default(document).off("focusin.bs.modal").on("focusin.bs.modal",(function(e){document!==e.target&&t._element!==e.target&&0===i.default(t._element).has(e.target).length&&t._element.focus()}))},e._setEscapeEvent=function(){var t=this;this._isShown?i.default(this._element).on("keydown.dismiss.bs.modal",(function(e){t._config.keyboard&&27===e.which?(e.preventDefault(),t.hide()):t._config.keyboard||27!==e.which||t._triggerBackdropTransition()})):this._isShown||i.default(this._element).off("keydown.dismiss.bs.modal")},e._setResizeEvent=function(){var t=this;this._isShown?i.default(window).on("resize.bs.modal",(function(e){return t.handleUpdate(e)})):i.default(window).off("resize.bs.modal")},e._hideModal=function(){var t=this;this._element.style.display="none",this._element.setAttribute("aria-hidden",!0),this._element.removeAttribute("aria-modal"),this._element.removeAttribute("role"),this._isTransitioning=!1,this._showBackdrop((function(){i.default(document.body).removeClass("modal-open"),t._resetAdjustments(),t._resetScrollbar(),i.default(t._element).trigger("hidden.bs.modal")}))},e._removeBackdrop=function(){this._backdrop&&(i.default(this._backdrop).remove(),this._backdrop=null)},e._showBackdrop=function(t){var e=this,n=i.default(this._element).hasClass("fade")?"fade":"";if(this._isShown&&this._config.backdrop){if(this._backdrop=document.createElement("div"),this._backdrop.className="modal-backdrop",n&&this._backdrop.classList.add(n),i.default(this._backdrop).appendTo(document.body),i.default(this._element).on("click.dismiss.bs.modal",(function(t){e._ignoreBackdropClick?e._ignoreBackdropClick=!1:t.target===t.currentTarget&&("static"===e._config.backdrop?e._triggerBackdropTransition():e.hide())})),n&&l.reflow(this._backdrop),i.default(this._backdrop).addClass("show"),!t)return;if(!n)return void t();var 
o=l.getTransitionDurationFromElement(this._backdrop);i.default(this._backdrop).one(l.TRANSITION_END,t).emulateTransitionEnd(o)}else if(!this._isShown&&this._backdrop){i.default(this._backdrop).removeClass("show");var r=function(){e._removeBackdrop(),t&&t()};if(i.default(this._element).hasClass("fade")){var a=l.getTransitionDurationFromElement(this._backdrop);i.default(this._backdrop).one(l.TRANSITION_END,r).emulateTransitionEnd(a)}else r()}else t&&t()},e._adjustDialog=function(){var t=this._element.scrollHeight>document.documentElement.clientHeight;!this._isBodyOverflowing&&t&&(this._element.style.paddingLeft=this._scrollbarWidth+"px"),this._isBodyOverflowing&&!t&&(this._element.style.paddingRight=this._scrollbarWidth+"px")},e._resetAdjustments=function(){this._element.style.paddingLeft="",this._element.style.paddingRight=""},e._checkScrollbar=function(){var t=document.body.getBoundingClientRect();this._isBodyOverflowing=Math.round(t.left+t.right)
',trigger:"hover focus",title:"",delay:0,html:!1,selector:!1,placement:"top",offset:0,container:!1,fallbackPlacement:"flip",boundary:"scrollParent",customClass:"",sanitize:!0,sanitizeFn:null,whiteList:Qt,popperConfig:null},Zt={HIDE:"hide.bs.tooltip",HIDDEN:"hidden.bs.tooltip",SHOW:"show.bs.tooltip",SHOWN:"shown.bs.tooltip",INSERTED:"inserted.bs.tooltip",CLICK:"click.bs.tooltip",FOCUSIN:"focusin.bs.tooltip",FOCUSOUT:"focusout.bs.tooltip",MOUSEENTER:"mouseenter.bs.tooltip",MOUSELEAVE:"mouseleave.bs.tooltip"},te=function(){function t(t,e){if("undefined"==typeof It)throw new TypeError("Bootstrap's tooltips require Popper (https://popper.js.org)");this._isEnabled=!0,this._timeout=0,this._hoverState="",this._activeTrigger={},this._popper=null,this.element=t,this.config=this._getConfig(e),this.tip=null,this._setListeners()}var e=t.prototype;return e.enable=function(){this._isEnabled=!0},e.disable=function(){this._isEnabled=!1},e.toggleEnabled=function(){this._isEnabled=!this._isEnabled},e.toggle=function(t){if(this._isEnabled)if(t){var e=this.constructor.DATA_KEY,n=i.default(t.currentTarget).data(e);n||(n=new this.constructor(t.currentTarget,this._getDelegateConfig()),i.default(t.currentTarget).data(e,n)),n._activeTrigger.click=!n._activeTrigger.click,n._isWithActiveTrigger()?n._enter(null,n):n._leave(null,n)}else{if(i.default(this.getTipElement()).hasClass("show"))return void this._leave(null,this);this._enter(null,this)}},e.dispose=function(){clearTimeout(this._timeout),i.default.removeData(this.element,this.constructor.DATA_KEY),i.default(this.element).off(this.constructor.EVENT_KEY),i.default(this.element).closest(".modal").off("hide.bs.modal",this._hideModalHandler),this.tip&&i.default(this.tip).remove(),this._isEnabled=null,this._timeout=null,this._hoverState=null,this._activeTrigger=null,this._popper&&this._popper.destroy(),this._popper=null,this.element=null,this.config=null,this.tip=null},e.show=function(){var t=this;if("none"===i.default(this.element).css("display"))throw new Error("Please use show on visible elements");var e=i.default.Event(this.constructor.Event.SHOW);if(this.isWithContent()&&this._isEnabled){i.default(this.element).trigger(e);var n=l.findShadowRoot(this.element),o=i.default.contains(null!==n?n:this.element.ownerDocument.documentElement,this.element);if(e.isDefaultPrevented()||!o)return;var r=this.getTipElement(),a=l.getUID(this.constructor.NAME);r.setAttribute("id",a),this.element.setAttribute("aria-describedby",a),this.setContent(),this.config.animation&&i.default(r).addClass("fade");var s="function"==typeof this.config.placement?this.config.placement.call(this,r,this.element):this.config.placement,u=this._getAttachment(s);this.addAttachmentClass(u);var f=this._getContainer();i.default(r).data(this.constructor.DATA_KEY,this),i.default.contains(this.element.ownerDocument.documentElement,this.tip)||i.default(r).appendTo(f),i.default(this.element).trigger(this.constructor.Event.INSERTED),this._popper=new It(this.element,r,this._getPopperConfig(u)),i.default(r).addClass("show"),i.default(r).addClass(this.config.customClass),"ontouchstart"in document.documentElement&&i.default(document.body).children().on("mouseover",null,i.default.noop);var d=function(){t.config.animation&&t._fixTransition();var e=t._hoverState;t._hoverState=null,i.default(t.element).trigger(t.constructor.Event.SHOWN),"out"===e&&t._leave(null,t)};if(i.default(this.tip).hasClass("fade")){var 
c=l.getTransitionDurationFromElement(this.tip);i.default(this.tip).one(l.TRANSITION_END,d).emulateTransitionEnd(c)}else d()}},e.hide=function(t){var e=this,n=this.getTipElement(),o=i.default.Event(this.constructor.Event.HIDE),r=function(){"show"!==e._hoverState&&n.parentNode&&n.parentNode.removeChild(n),e._cleanTipClass(),e.element.removeAttribute("aria-describedby"),i.default(e.element).trigger(e.constructor.Event.HIDDEN),null!==e._popper&&e._popper.destroy(),t&&t()};if(i.default(this.element).trigger(o),!o.isDefaultPrevented()){if(i.default(n).removeClass("show"),"ontouchstart"in document.documentElement&&i.default(document.body).children().off("mouseover",null,i.default.noop),this._activeTrigger.click=!1,this._activeTrigger.focus=!1,this._activeTrigger.hover=!1,i.default(this.tip).hasClass("fade")){var a=l.getTransitionDurationFromElement(n);i.default(n).one(l.TRANSITION_END,r).emulateTransitionEnd(a)}else r();this._hoverState=""}},e.update=function(){null!==this._popper&&this._popper.scheduleUpdate()},e.isWithContent=function(){return Boolean(this.getTitle())},e.addAttachmentClass=function(t){i.default(this.getTipElement()).addClass("bs-tooltip-"+t)},e.getTipElement=function(){return this.tip=this.tip||i.default(this.config.template)[0],this.tip},e.setContent=function(){var t=this.getTipElement();this.setElementContent(i.default(t.querySelectorAll(".tooltip-inner")),this.getTitle()),i.default(t).removeClass("fade show")},e.setElementContent=function(t,e){"object"!=typeof e||!e.nodeType&&!e.jquery?this.config.html?(this.config.sanitize&&(e=Vt(e,this.config.whiteList,this.config.sanitizeFn)),t.html(e)):t.text(e):this.config.html?i.default(e).parent().is(t)||t.empty().append(e):t.text(i.default(e).text())},e.getTitle=function(){var t=this.element.getAttribute("data-original-title");return t||(t="function"==typeof this.config.title?this.config.title.call(this.element):this.config.title),t},e._getPopperConfig=function(t){var e=this;return a({},{placement:t,modifiers:{offset:this._getOffset(),flip:{behavior:this.config.fallbackPlacement},arrow:{element:".arrow"},preventOverflow:{boundariesElement:this.config.boundary}},onCreate:function(t){t.originalPlacement!==t.placement&&e._handlePopperPlacementChange(t)},onUpdate:function(t){return e._handlePopperPlacementChange(t)}},this.config.popperConfig)},e._getOffset=function(){var t=this,e={};return"function"==typeof this.config.offset?e.fn=function(e){return e.offsets=a({},e.offsets,t.config.offset(e.offsets,t.element)||{}),e}:e.offset=this.config.offset,e},e._getContainer=function(){return!1===this.config.container?document.body:l.isElement(this.config.container)?i.default(this.config.container):i.default(document).find(this.config.container)},e._getAttachment=function(t){return $t[t.toUpperCase()]},e._setListeners=function(){var t=this;this.config.trigger.split(" ").forEach((function(e){if("click"===e)i.default(t.element).on(t.constructor.Event.CLICK,t.config.selector,(function(e){return t.toggle(e)}));else if("manual"!==e){var n="hover"===e?t.constructor.Event.MOUSEENTER:t.constructor.Event.FOCUSIN,o="hover"===e?t.constructor.Event.MOUSELEAVE:t.constructor.Event.FOCUSOUT;i.default(t.element).on(n,t.config.selector,(function(e){return t._enter(e)})).on(o,t.config.selector,(function(e){return 
t._leave(e)}))}})),this._hideModalHandler=function(){t.element&&t.hide()},i.default(this.element).closest(".modal").on("hide.bs.modal",this._hideModalHandler),this.config.selector?this.config=a({},this.config,{trigger:"manual",selector:""}):this._fixTitle()},e._fixTitle=function(){var t=typeof this.element.getAttribute("data-original-title");(this.element.getAttribute("title")||"string"!==t)&&(this.element.setAttribute("data-original-title",this.element.getAttribute("title")||""),this.element.setAttribute("title",""))},e._enter=function(t,e){var n=this.constructor.DATA_KEY;(e=e||i.default(t.currentTarget).data(n))||(e=new this.constructor(t.currentTarget,this._getDelegateConfig()),i.default(t.currentTarget).data(n,e)),t&&(e._activeTrigger["focusin"===t.type?"focus":"hover"]=!0),i.default(e.getTipElement()).hasClass("show")||"show"===e._hoverState?e._hoverState="show":(clearTimeout(e._timeout),e._hoverState="show",e.config.delay&&e.config.delay.show?e._timeout=setTimeout((function(){"show"===e._hoverState&&e.show()}),e.config.delay.show):e.show())},e._leave=function(t,e){var n=this.constructor.DATA_KEY;(e=e||i.default(t.currentTarget).data(n))||(e=new this.constructor(t.currentTarget,this._getDelegateConfig()),i.default(t.currentTarget).data(n,e)),t&&(e._activeTrigger["focusout"===t.type?"focus":"hover"]=!1),e._isWithActiveTrigger()||(clearTimeout(e._timeout),e._hoverState="out",e.config.delay&&e.config.delay.hide?e._timeout=setTimeout((function(){"out"===e._hoverState&&e.hide()}),e.config.delay.hide):e.hide())},e._isWithActiveTrigger=function(){for(var t in this._activeTrigger)if(this._activeTrigger[t])return!0;return!1},e._getConfig=function(t){var e=i.default(this.element).data();return Object.keys(e).forEach((function(t){-1!==Kt.indexOf(t)&&delete e[t]})),"number"==typeof(t=a({},this.constructor.Default,e,"object"==typeof t&&t?t:{})).delay&&(t.delay={show:t.delay,hide:t.delay}),"number"==typeof t.title&&(t.title=t.title.toString()),"number"==typeof t.content&&(t.content=t.content.toString()),l.typeCheckConfig(Yt,t,this.constructor.DefaultType),t.sanitize&&(t.template=Vt(t.template,t.whiteList,t.sanitizeFn)),t},e._getDelegateConfig=function(){var t={};if(this.config)for(var e in this.config)this.constructor.Default[e]!==this.config[e]&&(t[e]=this.config[e]);return t},e._cleanTipClass=function(){var t=i.default(this.getTipElement()),e=t.attr("class").match(Xt);null!==e&&e.length&&t.removeClass(e.join(""))},e._handlePopperPlacementChange=function(t){this.tip=t.instance.popper,this._cleanTipClass(),this.addAttachmentClass(this._getAttachment(t.placement))},e._fixTransition=function(){var t=this.getTipElement(),e=this.config.animation;null===t.getAttribute("x-placement")&&(i.default(t).removeClass("fade"),this.config.animation=!1,this.hide(),this.show(),this.config.animation=e)},t._jQueryInterface=function(e){return this.each((function(){var n=i.default(this),o=n.data("bs.tooltip"),r="object"==typeof e&&e;if((o||!/dispose|hide/.test(e))&&(o||(o=new t(this,r),n.data("bs.tooltip",o)),"string"==typeof e)){if("undefined"==typeof o[e])throw new TypeError('No method named "'+e+'"');o[e]()}}))},r(t,null,[{key:"VERSION",get:function(){return"4.6.0"}},{key:"Default",get:function(){return Jt}},{key:"NAME",get:function(){return Yt}},{key:"DATA_KEY",get:function(){return"bs.tooltip"}},{key:"Event",get:function(){return Zt}},{key:"EVENT_KEY",get:function(){return".bs.tooltip"}},{key:"DefaultType",get:function(){return 
Gt}}]),t}();i.default.fn[Yt]=te._jQueryInterface,i.default.fn[Yt].Constructor=te,i.default.fn[Yt].noConflict=function(){return i.default.fn[Yt]=zt,te._jQueryInterface};var ee="popover",ne=i.default.fn[ee],ie=new RegExp("(^|\\s)bs-popover\\S+","g"),oe=a({},te.Default,{placement:"right",trigger:"click",content:"",template:''}),re=a({},te.DefaultType,{content:"(string|element|function)"}),ae={HIDE:"hide.bs.popover",HIDDEN:"hidden.bs.popover",SHOW:"show.bs.popover",SHOWN:"shown.bs.popover",INSERTED:"inserted.bs.popover",CLICK:"click.bs.popover",FOCUSIN:"focusin.bs.popover",FOCUSOUT:"focusout.bs.popover",MOUSEENTER:"mouseenter.bs.popover",MOUSELEAVE:"mouseleave.bs.popover"},se=function(t){var e,n;function o(){return t.apply(this,arguments)||this}n=t,(e=o).prototype=Object.create(n.prototype),e.prototype.constructor=e,e.__proto__=n;var a=o.prototype;return a.isWithContent=function(){return this.getTitle()||this._getContent()},a.addAttachmentClass=function(t){i.default(this.getTipElement()).addClass("bs-popover-"+t)},a.getTipElement=function(){return this.tip=this.tip||i.default(this.config.template)[0],this.tip},a.setContent=function(){var t=i.default(this.getTipElement());this.setElementContent(t.find(".popover-header"),this.getTitle());var e=this._getContent();"function"==typeof e&&(e=e.call(this.element)),this.setElementContent(t.find(".popover-body"),e),t.removeClass("fade show")},a._getContent=function(){return this.element.getAttribute("data-content")||this.config.content},a._cleanTipClass=function(){var t=i.default(this.getTipElement()),e=t.attr("class").match(ie);null!==e&&e.length>0&&t.removeClass(e.join(""))},o._jQueryInterface=function(t){return this.each((function(){var e=i.default(this).data("bs.popover"),n="object"==typeof t?t:null;if((e||!/dispose|hide/.test(t))&&(e||(e=new o(this,n),i.default(this).data("bs.popover",e)),"string"==typeof t)){if("undefined"==typeof e[t])throw new TypeError('No method named "'+t+'"');e[t]()}}))},r(o,null,[{key:"VERSION",get:function(){return"4.6.0"}},{key:"Default",get:function(){return oe}},{key:"NAME",get:function(){return ee}},{key:"DATA_KEY",get:function(){return"bs.popover"}},{key:"Event",get:function(){return ae}},{key:"EVENT_KEY",get:function(){return".bs.popover"}},{key:"DefaultType",get:function(){return re}}]),o}(te);i.default.fn[ee]=se._jQueryInterface,i.default.fn[ee].Constructor=se,i.default.fn[ee].noConflict=function(){return i.default.fn[ee]=ne,se._jQueryInterface};var le="scrollspy",ue=i.default.fn[le],fe={offset:10,method:"auto",target:""},de={offset:"number",method:"string",target:"(string|element)"},ce=function(){function t(t,e){var n=this;this._element=t,this._scrollElement="BODY"===t.tagName?window:t,this._config=this._getConfig(e),this._selector=this._config.target+" .nav-link,"+this._config.target+" .list-group-item,"+this._config.target+" .dropdown-item",this._offsets=[],this._targets=[],this._activeTarget=null,this._scrollHeight=0,i.default(this._scrollElement).on("scroll.bs.scrollspy",(function(t){return n._process(t)})),this.refresh(),this._process()}var e=t.prototype;return e.refresh=function(){var t=this,e=this._scrollElement===this._scrollElement.window?"offset":"position",n="auto"===this._config.method?e:this._config.method,o="position"===n?this._getScrollTop():0;this._offsets=[],this._targets=[],this._scrollHeight=this._getScrollHeight(),[].slice.call(document.querySelectorAll(this._selector)).map((function(t){var e,r=l.getSelectorFromElement(t);if(r&&(e=document.querySelector(r)),e){var 
a=e.getBoundingClientRect();if(a.width||a.height)return[i.default(e)[n]().top+o,r]}return null})).filter((function(t){return t})).sort((function(t,e){return t[0]-e[0]})).forEach((function(e){t._offsets.push(e[0]),t._targets.push(e[1])}))},e.dispose=function(){i.default.removeData(this._element,"bs.scrollspy"),i.default(this._scrollElement).off(".bs.scrollspy"),this._element=null,this._scrollElement=null,this._config=null,this._selector=null,this._offsets=null,this._targets=null,this._activeTarget=null,this._scrollHeight=null},e._getConfig=function(t){if("string"!=typeof(t=a({},fe,"object"==typeof t&&t?t:{})).target&&l.isElement(t.target)){var e=i.default(t.target).attr("id");e||(e=l.getUID(le),i.default(t.target).attr("id",e)),t.target="#"+e}return l.typeCheckConfig(le,t,de),t},e._getScrollTop=function(){return this._scrollElement===window?this._scrollElement.pageYOffset:this._scrollElement.scrollTop},e._getScrollHeight=function(){return this._scrollElement.scrollHeight||Math.max(document.body.scrollHeight,document.documentElement.scrollHeight)},e._getOffsetHeight=function(){return this._scrollElement===window?window.innerHeight:this._scrollElement.getBoundingClientRect().height},e._process=function(){var t=this._getScrollTop()+this._config.offset,e=this._getScrollHeight(),n=this._config.offset+e-this._getOffsetHeight();if(this._scrollHeight!==e&&this.refresh(),t>=n){var i=this._targets[this._targets.length-1];this._activeTarget!==i&&this._activate(i)}else{if(this._activeTarget&&t0)return this._activeTarget=null,void this._clear();for(var o=this._offsets.length;o--;){this._activeTarget!==this._targets[o]&&t>=this._offsets[o]&&("undefined"==typeof this._offsets[o+1]||t li > .active":".active";n=(n=i.default.makeArray(i.default(o).find(a)))[n.length-1]}var s=i.default.Event("hide.bs.tab",{relatedTarget:this._element}),u=i.default.Event("show.bs.tab",{relatedTarget:n});if(n&&i.default(n).trigger(s),i.default(this._element).trigger(u),!u.isDefaultPrevented()&&!s.isDefaultPrevented()){r&&(e=document.querySelector(r)),this._activate(this._element,o);var f=function(){var e=i.default.Event("hidden.bs.tab",{relatedTarget:t._element}),o=i.default.Event("shown.bs.tab",{relatedTarget:n});i.default(n).trigger(e),i.default(t._element).trigger(o)};e?this._activate(e,e.parentNode,f):f()}}},e.dispose=function(){i.default.removeData(this._element,"bs.tab"),this._element=null},e._activate=function(t,e,n){var o=this,r=(!e||"UL"!==e.nodeName&&"OL"!==e.nodeName?i.default(e).children(".active"):i.default(e).find("> li > .active"))[0],a=n&&r&&i.default(r).hasClass("fade"),s=function(){return o._transitionComplete(t,r,n)};if(r&&a){var u=l.getTransitionDurationFromElement(r);i.default(r).removeClass("show").one(l.TRANSITION_END,s).emulateTransitionEnd(u)}else s()},e._transitionComplete=function(t,e,n){if(e){i.default(e).removeClass("active");var o=i.default(e.parentNode).find("> .dropdown-menu .active")[0];o&&i.default(o).removeClass("active"),"tab"===e.getAttribute("role")&&e.setAttribute("aria-selected",!1)}if(i.default(t).addClass("active"),"tab"===t.getAttribute("role")&&t.setAttribute("aria-selected",!0),l.reflow(t),t.classList.contains("fade")&&t.classList.add("show"),t.parentNode&&i.default(t.parentNode).hasClass("dropdown-menu")){var r=i.default(t).closest(".dropdown")[0];if(r){var a=[].slice.call(r.querySelectorAll(".dropdown-toggle"));i.default(a).addClass("active")}t.setAttribute("aria-expanded",!0)}n&&n()},t._jQueryInterface=function(e){return this.each((function(){var 
n=i.default(this),o=n.data("bs.tab");if(o||(o=new t(this),n.data("bs.tab",o)),"string"==typeof e){if("undefined"==typeof o[e])throw new TypeError('No method named "'+e+'"');o[e]()}}))},r(t,null,[{key:"VERSION",get:function(){return"4.6.0"}}]),t}();i.default(document).on("click.bs.tab.data-api",'[data-toggle="tab"], [data-toggle="pill"], [data-toggle="list"]',(function(t){t.preventDefault(),pe._jQueryInterface.call(i.default(this),"show")})),i.default.fn.tab=pe._jQueryInterface,i.default.fn.tab.Constructor=pe,i.default.fn.tab.noConflict=function(){return i.default.fn.tab=he,pe._jQueryInterface};var me=i.default.fn.toast,ge={animation:"boolean",autohide:"boolean",delay:"number"},ve={animation:!0,autohide:!0,delay:500},_e=function(){function t(t,e){this._element=t,this._config=this._getConfig(e),this._timeout=null,this._setListeners()}var e=t.prototype;return e.show=function(){var t=this,e=i.default.Event("show.bs.toast");if(i.default(this._element).trigger(e),!e.isDefaultPrevented()){this._clearTimeout(),this._config.animation&&this._element.classList.add("fade");var n=function(){t._element.classList.remove("showing"),t._element.classList.add("show"),i.default(t._element).trigger("shown.bs.toast"),t._config.autohide&&(t._timeout=setTimeout((function(){t.hide()}),t._config.delay))};if(this._element.classList.remove("hide"),l.reflow(this._element),this._element.classList.add("showing"),this._config.animation){var o=l.getTransitionDurationFromElement(this._element);i.default(this._element).one(l.TRANSITION_END,n).emulateTransitionEnd(o)}else n()}},e.hide=function(){if(this._element.classList.contains("show")){var t=i.default.Event("hide.bs.toast");i.default(this._element).trigger(t),t.isDefaultPrevented()||this._close()}},e.dispose=function(){this._clearTimeout(),this._element.classList.contains("show")&&this._element.classList.remove("show"),i.default(this._element).off("click.dismiss.bs.toast"),i.default.removeData(this._element,"bs.toast"),this._element=null,this._config=null},e._getConfig=function(t){return t=a({},ve,i.default(this._element).data(),"object"==typeof t&&t?t:{}),l.typeCheckConfig("toast",t,this.constructor.DefaultType),t},e._setListeners=function(){var t=this;i.default(this._element).on("click.dismiss.bs.toast",'[data-dismiss="toast"]',(function(){return t.hide()}))},e._close=function(){var t=this,e=function(){t._element.classList.add("hide"),i.default(t._element).trigger("hidden.bs.toast")};if(this._element.classList.remove("show"),this._config.animation){var n=l.getTransitionDurationFromElement(this._element);i.default(this._element).one(l.TRANSITION_END,e).emulateTransitionEnd(n)}else e()},e._clearTimeout=function(){clearTimeout(this._timeout),this._timeout=null},t._jQueryInterface=function(e){return this.each((function(){var n=i.default(this),o=n.data("bs.toast");if(o||(o=new t(this,"object"==typeof e&&e),n.data("bs.toast",o)),"string"==typeof e){if("undefined"==typeof o[e])throw new TypeError('No method named "'+e+'"');o[e](this)}}))},r(t,null,[{key:"VERSION",get:function(){return"4.6.0"}},{key:"DefaultType",get:function(){return ge}},{key:"Default",get:function(){return ve}}]),t}();i.default.fn.toast=_e._jQueryInterface,i.default.fn.toast.Constructor=_e,i.default.fn.toast.noConflict=function(){return i.default.fn.toast=me,_e._jQueryInterface},t.Alert=d,t.Button=h,t.Carousel=y,t.Collapse=S,t.Dropdown=Ft,t.Modal=qt,t.Popover=se,t.Scrollspy=ce,t.Tab=pe,t.Toast=_e,t.Tooltip=te,t.Util=l,Object.defineProperty(t,"__esModule",{value:!0})})); diff --git 
a/js/_vendor/medium-zoom.esm.js b/js/_vendor/medium-zoom.esm.js new file mode 100644 index 00000000..fa2b3776 --- /dev/null +++ b/js/_vendor/medium-zoom.esm.js @@ -0,0 +1,622 @@ +/*! medium-zoom 1.0.6 | MIT License | https://github.com/francoischalifour/medium-zoom */ +var _extends = Object.assign || function (target) { + for (var i = 1; i < arguments.length; i++) { + var source = arguments[i]; + + for (var key in source) { + if (Object.prototype.hasOwnProperty.call(source, key)) { + target[key] = source[key]; + } + } + } + + return target; +}; + +var isSupported = function isSupported(node) { + return node.tagName === 'IMG'; +}; + +/* eslint-disable-next-line no-prototype-builtins */ +var isNodeList = function isNodeList(selector) { + return NodeList.prototype.isPrototypeOf(selector); +}; + +var isNode = function isNode(selector) { + return selector && selector.nodeType === 1; +}; + +var isSvg = function isSvg(image) { + var source = image.currentSrc || image.src; + return source.substr(-4).toLowerCase() === '.svg'; +}; + +var getImagesFromSelector = function getImagesFromSelector(selector) { + try { + if (Array.isArray(selector)) { + return selector.filter(isSupported); + } + + if (isNodeList(selector)) { + // Do not use spread operator or Array.from() for IE support + return [].slice.call(selector).filter(isSupported); + } + + if (isNode(selector)) { + return [selector].filter(isSupported); + } + + if (typeof selector === 'string') { + // Do not use spread operator or Array.from() for IE support + return [].slice.call(document.querySelectorAll(selector)).filter(isSupported); + } + + return []; + } catch (err) { + throw new TypeError('The provided selector is invalid.\n' + 'Expects a CSS selector, a Node element, a NodeList or an array.\n' + 'See: https://github.com/francoischalifour/medium-zoom'); + } +}; + +var createOverlay = function createOverlay(background) { + var overlay = document.createElement('div'); + overlay.classList.add('medium-zoom-overlay'); + overlay.style.background = background; + + return overlay; +}; + +var cloneTarget = function cloneTarget(template) { + var _template$getBounding = template.getBoundingClientRect(), + top = _template$getBounding.top, + left = _template$getBounding.left, + width = _template$getBounding.width, + height = _template$getBounding.height; + + var clone = template.cloneNode(); + var scrollTop = window.pageYOffset || document.documentElement.scrollTop || document.body.scrollTop || 0; + var scrollLeft = window.pageXOffset || document.documentElement.scrollLeft || document.body.scrollLeft || 0; + + clone.removeAttribute('id'); + clone.style.position = 'absolute'; + clone.style.top = top + scrollTop + 'px'; + clone.style.left = left + scrollLeft + 'px'; + clone.style.width = width + 'px'; + clone.style.height = height + 'px'; + clone.style.transform = ''; + + return clone; +}; + +var createCustomEvent = function createCustomEvent(type, params) { + var eventParams = _extends({ + bubbles: false, + cancelable: false, + detail: undefined + }, params); + + if (typeof window.CustomEvent === 'function') { + return new CustomEvent(type, eventParams); + } + + var customEvent = document.createEvent('CustomEvent'); + customEvent.initCustomEvent(type, eventParams.bubbles, eventParams.cancelable, eventParams.detail); + + return customEvent; +}; + +var mediumZoomEsm = function mediumZoom(selector) { + var options = arguments.length > 1 && arguments[1] !== undefined ? 
arguments[1] : {}; + + /** + * Ensure the compatibility with IE11 if no Promise polyfill are used. + */ + var Promise = window.Promise || function Promise(fn) { + function noop() {} + fn(noop, noop); + }; + + var _handleClick = function _handleClick(event) { + var target = event.target; + + + if (target === overlay) { + close(); + return; + } + + if (images.indexOf(target) === -1) { + return; + } + + toggle({ target: target }); + }; + + var _handleScroll = function _handleScroll() { + if (isAnimating || !active.original) { + return; + } + + var currentScroll = window.pageYOffset || document.documentElement.scrollTop || document.body.scrollTop || 0; + + if (Math.abs(scrollTop - currentScroll) > zoomOptions.scrollOffset) { + setTimeout(close, 150); + } + }; + + var _handleKeyUp = function _handleKeyUp(event) { + var key = event.key || event.keyCode; + + // Close if escape key is pressed + if (key === 'Escape' || key === 'Esc' || key === 27) { + close(); + } + }; + + var update = function update() { + var options = arguments.length > 0 && arguments[0] !== undefined ? arguments[0] : {}; + + var newOptions = options; + + if (options.background) { + overlay.style.background = options.background; + } + + if (options.container && options.container instanceof Object) { + newOptions.container = _extends({}, zoomOptions.container, options.container); + } + + if (options.template) { + var template = isNode(options.template) ? options.template : document.querySelector(options.template); + + newOptions.template = template; + } + + zoomOptions = _extends({}, zoomOptions, newOptions); + + images.forEach(function (image) { + image.dispatchEvent(createCustomEvent('medium-zoom:update', { + detail: { zoom: zoom } + })); + }); + + return zoom; + }; + + var clone = function clone() { + var options = arguments.length > 0 && arguments[0] !== undefined ? arguments[0] : {}; + return mediumZoomEsm(_extends({}, zoomOptions, options)); + }; + + var attach = function attach() { + for (var _len = arguments.length, selectors = Array(_len), _key = 0; _key < _len; _key++) { + selectors[_key] = arguments[_key]; + } + + var newImages = selectors.reduce(function (imagesAccumulator, currentSelector) { + return [].concat(imagesAccumulator, getImagesFromSelector(currentSelector)); + }, []); + + newImages.filter(function (newImage) { + return images.indexOf(newImage) === -1; + }).forEach(function (newImage) { + images.push(newImage); + newImage.classList.add('medium-zoom-image'); + }); + + eventListeners.forEach(function (_ref) { + var type = _ref.type, + listener = _ref.listener, + options = _ref.options; + + newImages.forEach(function (image) { + image.addEventListener(type, listener, options); + }); + }); + + return zoom; + }; + + var detach = function detach() { + for (var _len2 = arguments.length, selectors = Array(_len2), _key2 = 0; _key2 < _len2; _key2++) { + selectors[_key2] = arguments[_key2]; + } + + if (active.zoomed) { + close(); + } + + var imagesToDetach = selectors.length > 0 ? 
selectors.reduce(function (imagesAccumulator, currentSelector) { + return [].concat(imagesAccumulator, getImagesFromSelector(currentSelector)); + }, []) : images; + + imagesToDetach.forEach(function (image) { + image.classList.remove('medium-zoom-image'); + image.dispatchEvent(createCustomEvent('medium-zoom:detach', { + detail: { zoom: zoom } + })); + }); + + images = images.filter(function (image) { + return imagesToDetach.indexOf(image) === -1; + }); + + return zoom; + }; + + var on = function on(type, listener) { + var options = arguments.length > 2 && arguments[2] !== undefined ? arguments[2] : {}; + + images.forEach(function (image) { + image.addEventListener('medium-zoom:' + type, listener, options); + }); + + eventListeners.push({ type: 'medium-zoom:' + type, listener: listener, options: options }); + + return zoom; + }; + + var off = function off(type, listener) { + var options = arguments.length > 2 && arguments[2] !== undefined ? arguments[2] : {}; + + images.forEach(function (image) { + image.removeEventListener('medium-zoom:' + type, listener, options); + }); + + eventListeners = eventListeners.filter(function (eventListener) { + return !(eventListener.type === 'medium-zoom:' + type && eventListener.listener.toString() === listener.toString()); + }); + + return zoom; + }; + + var open = function open() { + var _ref2 = arguments.length > 0 && arguments[0] !== undefined ? arguments[0] : {}, + target = _ref2.target; + + var _animate = function _animate() { + var container = { + width: document.documentElement.clientWidth, + height: document.documentElement.clientHeight, + left: 0, + top: 0, + right: 0, + bottom: 0 + }; + var viewportWidth = void 0; + var viewportHeight = void 0; + + if (zoomOptions.container) { + if (zoomOptions.container instanceof Object) { + // The container is given as an object with properties like width, height, left, top + container = _extends({}, container, zoomOptions.container); + + // We need to adjust custom options like container.right or container.bottom + viewportWidth = container.width - container.left - container.right - zoomOptions.margin * 2; + viewportHeight = container.height - container.top - container.bottom - zoomOptions.margin * 2; + } else { + // The container is given as an element + var zoomContainer = isNode(zoomOptions.container) ? zoomOptions.container : document.querySelector(zoomOptions.container); + + var _zoomContainer$getBou = zoomContainer.getBoundingClientRect(), + _width = _zoomContainer$getBou.width, + _height = _zoomContainer$getBou.height, + _left = _zoomContainer$getBou.left, + _top = _zoomContainer$getBou.top; + + container = _extends({}, container, { + width: _width, + height: _height, + left: _left, + top: _top + }); + } + } + + viewportWidth = viewportWidth || container.width - zoomOptions.margin * 2; + viewportHeight = viewportHeight || container.height - zoomOptions.margin * 2; + + var zoomTarget = active.zoomedHd || active.original; + var naturalWidth = isSvg(zoomTarget) ? viewportWidth : zoomTarget.naturalWidth || viewportWidth; + var naturalHeight = isSvg(zoomTarget) ? 
viewportHeight : zoomTarget.naturalHeight || viewportHeight; + + var _zoomTarget$getBoundi = zoomTarget.getBoundingClientRect(), + top = _zoomTarget$getBoundi.top, + left = _zoomTarget$getBoundi.left, + width = _zoomTarget$getBoundi.width, + height = _zoomTarget$getBoundi.height; + + var scaleX = Math.min(naturalWidth, viewportWidth) / width; + var scaleY = Math.min(naturalHeight, viewportHeight) / height; + var scale = Math.min(scaleX, scaleY); + var translateX = (-left + (viewportWidth - width) / 2 + zoomOptions.margin + container.left) / scale; + var translateY = (-top + (viewportHeight - height) / 2 + zoomOptions.margin + container.top) / scale; + var transform = 'scale(' + scale + ') translate3d(' + translateX + 'px, ' + translateY + 'px, 0)'; + + active.zoomed.style.transform = transform; + + if (active.zoomedHd) { + active.zoomedHd.style.transform = transform; + } + }; + + return new Promise(function (resolve) { + if (target && images.indexOf(target) === -1) { + resolve(zoom); + return; + } + + var _handleOpenEnd = function _handleOpenEnd() { + isAnimating = false; + active.zoomed.removeEventListener('transitionend', _handleOpenEnd); + active.original.dispatchEvent(createCustomEvent('medium-zoom:opened', { + detail: { zoom: zoom } + })); + + resolve(zoom); + }; + + if (active.zoomed) { + resolve(zoom); + return; + } + + if (target) { + // The zoom was triggered manually via a click + active.original = target; + } else if (images.length > 0) { +var _images = images; + active.original = _images[0]; + } else { + resolve(zoom); + return; + } + + active.original.dispatchEvent(createCustomEvent('medium-zoom:open', { + detail: { zoom: zoom } + })); + + scrollTop = window.pageYOffset || document.documentElement.scrollTop || document.body.scrollTop || 0; + isAnimating = true; + active.zoomed = cloneTarget(active.original); + + document.body.appendChild(overlay); + + if (zoomOptions.template) { + var template = isNode(zoomOptions.template) ? zoomOptions.template : document.querySelector(zoomOptions.template); + active.template = document.createElement('div'); + active.template.appendChild(template.content.cloneNode(true)); + + document.body.appendChild(active.template); + } + + document.body.appendChild(active.zoomed); + + window.requestAnimationFrame(function () { + document.body.classList.add('medium-zoom--opened'); + }); + + active.original.classList.add('medium-zoom-image--hidden'); + active.zoomed.classList.add('medium-zoom-image--opened'); + + active.zoomed.addEventListener('click', close); + active.zoomed.addEventListener('transitionend', _handleOpenEnd); + + if (active.original.getAttribute('data-zoom-src')) { + active.zoomedHd = active.zoomed.cloneNode(); + + // Reset the `scrset` property or the HD image won't load. + active.zoomedHd.removeAttribute('srcset'); + active.zoomedHd.removeAttribute('sizes'); + + active.zoomedHd.src = active.zoomed.getAttribute('data-zoom-src'); + + active.zoomedHd.onerror = function () { + clearInterval(getZoomTargetSize); + console.warn('Unable to reach the zoom image target ' + active.zoomedHd.src); + active.zoomedHd = null; + _animate(); + }; + + // We need to access the natural size of the full HD + // target as fast as possible to compute the animation. 
+ var getZoomTargetSize = setInterval(function () { + if ( active.zoomedHd.complete) { + clearInterval(getZoomTargetSize); + active.zoomedHd.classList.add('medium-zoom-image--opened'); + active.zoomedHd.addEventListener('click', close); + document.body.appendChild(active.zoomedHd); + _animate(); + } + }, 10); + } else if (active.original.hasAttribute('srcset')) { + // If an image has a `srcset` attribuet, we don't know the dimensions of the + // zoomed (HD) image (like when `data-zoom-src` is specified). + // Therefore the approach is quite similar. + active.zoomedHd = active.zoomed.cloneNode(); + + // Resetting the sizes attribute tells the browser to load the + // image best fitting the current viewport size, respecting the `srcset`. + active.zoomedHd.removeAttribute('sizes'); + + // In Firefox, the `loading` attribute needs to be set to `eager` (default + // value) for the load event to be fired. + active.zoomedHd.removeAttribute('loading'); + + // Wait for the load event of the hd image. This will fire if the image + // is already cached. + var loadEventListener = active.zoomedHd.addEventListener('load', function () { + active.zoomedHd.removeEventListener('load', loadEventListener); + active.zoomedHd.classList.add('medium-zoom-image--opened'); + active.zoomedHd.addEventListener('click', close); + document.body.appendChild(active.zoomedHd); + _animate(); + }); + } else { + _animate(); + } + }); + }; + + var close = function close() { + return new Promise(function (resolve) { + if (isAnimating || !active.original) { + resolve(zoom); + return; + } + + var _handleCloseEnd = function _handleCloseEnd() { + active.original.classList.remove('medium-zoom-image--hidden'); + document.body.removeChild(active.zoomed); + if (active.zoomedHd) { + document.body.removeChild(active.zoomedHd); + } + document.body.removeChild(overlay); + active.zoomed.classList.remove('medium-zoom-image--opened'); + if (active.template) { + document.body.removeChild(active.template); + } + + isAnimating = false; + active.zoomed.removeEventListener('transitionend', _handleCloseEnd); + + active.original.dispatchEvent(createCustomEvent('medium-zoom:closed', { + detail: { zoom: zoom } + })); + + active.original = null; + active.zoomed = null; + active.zoomedHd = null; + active.template = null; + + resolve(zoom); + }; + + isAnimating = true; + document.body.classList.remove('medium-zoom--opened'); + active.zoomed.style.transform = ''; + + if (active.zoomedHd) { + active.zoomedHd.style.transform = ''; + } + + // Fade out the template so it's not too abrupt + if (active.template) { + active.template.style.transition = 'opacity 150ms'; + active.template.style.opacity = 0; + } + + active.original.dispatchEvent(createCustomEvent('medium-zoom:close', { + detail: { zoom: zoom } + })); + + active.zoomed.addEventListener('transitionend', _handleCloseEnd); + }); + }; + + var toggle = function toggle() { + var _ref3 = arguments.length > 0 && arguments[0] !== undefined ? 
arguments[0] : {}, + target = _ref3.target; + + if (active.original) { + return close(); + } + + return open({ target: target }); + }; + + var getOptions = function getOptions() { + return zoomOptions; + }; + + var getImages = function getImages() { + return images; + }; + + var getZoomedImage = function getZoomedImage() { + return active.original; + }; + + var images = []; + var eventListeners = []; + var isAnimating = false; + var scrollTop = 0; + var zoomOptions = options; + var active = { + original: null, + zoomed: null, + zoomedHd: null, + template: null + + // If the selector is omitted, it's replaced by the options + };if (Object.prototype.toString.call(selector) === '[object Object]') { + zoomOptions = selector; + } else if (selector || typeof selector === 'string' // to process empty string as a selector + ) { + attach(selector); + } + + // Apply the default option values + zoomOptions = _extends({ + margin: 0, + background: '#fff', + scrollOffset: 40, + container: null, + template: null + }, zoomOptions); + + var overlay = createOverlay(zoomOptions.background); + + document.addEventListener('click', _handleClick); + document.addEventListener('keyup', _handleKeyUp); + document.addEventListener('scroll', _handleScroll); + window.addEventListener('resize', close); + + var zoom = { + open: open, + close: close, + toggle: toggle, + update: update, + clone: clone, + attach: attach, + detach: detach, + on: on, + off: off, + getOptions: getOptions, + getImages: getImages, + getZoomedImage: getZoomedImage + }; + + return zoom; +}; + +function styleInject(css, ref) { + if ( ref === void 0 ) ref = {}; + var insertAt = ref.insertAt; + + if (!css || typeof document === 'undefined') { return; } + + var head = document.head || document.getElementsByTagName('head')[0]; + var style = document.createElement('style'); + style.type = 'text/css'; + + if (insertAt === 'top') { + if (head.firstChild) { + head.insertBefore(style, head.firstChild); + } else { + head.appendChild(style); + } + } else { + head.appendChild(style); + } + + if (style.styleSheet) { + style.styleSheet.cssText = css; + } else { + style.appendChild(document.createTextNode(css)); + } +} + +var css = ".medium-zoom-overlay{position:fixed;top:0;right:0;bottom:0;left:0;opacity:0;transition:opacity .3s;will-change:opacity}.medium-zoom--opened .medium-zoom-overlay{cursor:pointer;cursor:zoom-out;opacity:1}.medium-zoom-image{cursor:pointer;cursor:zoom-in;transition:transform .3s cubic-bezier(.2,0,.2,1)!important}.medium-zoom-image--hidden{visibility:hidden}.medium-zoom-image--opened{position:relative;cursor:pointer;cursor:zoom-out;will-change:transform}"; +styleInject(css); + +export default mediumZoomEsm; diff --git a/js/algolia-search.js b/js/algolia-search.js new file mode 100644 index 00000000..949d87bc --- /dev/null +++ b/js/algolia-search.js @@ -0,0 +1,74 @@ +/************************************************* + * Wowchemy + * https://github.com/wowchemy/wowchemy-hugo-modules + * + * Algolia based search algorithm. 
+ **************************************************/ + +import {algoliaConfig, i18n, content_type} from '@params'; + +function getTemplate(templateName) { + return document.querySelector(`#${templateName}-template`).innerHTML; +} + +if (typeof instantsearch === 'function' && $('#search-box').length) { + const options = { + appId: algoliaConfig.appId, + apiKey: algoliaConfig.apiKey, + indexName: algoliaConfig.indexName, + routing: true, + searchParameters: { + hitsPerPage: 10, + }, + searchFunction: function (helper) { + let searchResults = document.querySelector('#search-hits'); + if (helper.state.query === '') { + searchResults.style.display = 'none'; + return; + } + helper.search(); + searchResults.style.display = 'block'; + }, + }; + + const search = instantsearch(options); + + // Initialize search box. + search.addWidget( + instantsearch.widgets.searchBox({ + container: '#search-box', + autofocus: false, + reset: true, + poweredBy: algoliaConfig.poweredBy, + placeholder: i18n.placeholder, + }), + ); + + // Initialize search results. + search.addWidget( + instantsearch.widgets.infiniteHits({ + container: '#search-hits', + escapeHits: true, + templates: { + empty: '
<div class="search-no-results">' + i18n.no_results + '</div>
', + item: getTemplate('search-hit-algolia'), + }, + cssClasses: { + showmoreButton: 'btn btn-outline-primary', + }, + }), + ); + + // On render search results, localize the content type metadata. + search.on('render', function () { + $('.search-hit-type').each(function () { + let content_key = $(this).text(); + if (content_key in content_type) { + $(this).text(content_type[content_key]); + } + }); + }); + + // Start search. + search.start(); +} diff --git a/js/isotope.pkgd.min.js b/js/isotope.pkgd.min.js new file mode 100644 index 00000000..4d6c129c --- /dev/null +++ b/js/isotope.pkgd.min.js @@ -0,0 +1,12 @@ +/*! + * Isotope PACKAGED v3.0.6 + * + * Licensed GPLv3 for open source use + * or Isotope Commercial License for commercial use + * + * https://isotope.metafizzy.co + * Copyright 2010-2018 Metafizzy + */ + +!function(t,e){"function"==typeof define&&define.amd?define("jquery-bridget/jquery-bridget",["jquery"],function(i){return e(t,i)}):"object"==typeof module&&module.exports?module.exports=e(t,require("jquery")):t.jQueryBridget=e(t,t.jQuery)}(window,function(t,e){"use strict";function i(i,s,a){function u(t,e,o){var n,s="$()."+i+'("'+e+'")';return t.each(function(t,u){var h=a.data(u,i);if(!h)return void r(i+" not initialized. Cannot call methods, i.e. "+s);var d=h[e];if(!d||"_"==e.charAt(0))return void r(s+" is not a valid method");var l=d.apply(h,o);n=void 0===n?l:n}),void 0!==n?n:t}function h(t,e){t.each(function(t,o){var n=a.data(o,i);n?(n.option(e),n._init()):(n=new s(o,e),a.data(o,i,n))})}a=a||e||t.jQuery,a&&(s.prototype.option||(s.prototype.option=function(t){a.isPlainObject(t)&&(this.options=a.extend(!0,this.options,t))}),a.fn[i]=function(t){if("string"==typeof t){var e=n.call(arguments,1);return u(this,t,e)}return h(this,t),this},o(a))}function o(t){!t||t&&t.bridget||(t.bridget=i)}var n=Array.prototype.slice,s=t.console,r="undefined"==typeof s?function(){}:function(t){s.error(t)};return o(e||t.jQuery),i}),function(t,e){"function"==typeof define&&define.amd?define("ev-emitter/ev-emitter",e):"object"==typeof module&&module.exports?module.exports=e():t.EvEmitter=e()}("undefined"!=typeof window?window:this,function(){function t(){}var e=t.prototype;return e.on=function(t,e){if(t&&e){var i=this._events=this._events||{},o=i[t]=i[t]||[];return o.indexOf(e)==-1&&o.push(e),this}},e.once=function(t,e){if(t&&e){this.on(t,e);var i=this._onceEvents=this._onceEvents||{},o=i[t]=i[t]||{};return o[e]=!0,this}},e.off=function(t,e){var i=this._events&&this._events[t];if(i&&i.length){var o=i.indexOf(e);return o!=-1&&i.splice(o,1),this}},e.emitEvent=function(t,e){var i=this._events&&this._events[t];if(i&&i.length){i=i.slice(0),e=e||[];for(var o=this._onceEvents&&this._onceEvents[t],n=0;n